mirror of
https://github.com/DS4SD/docling.git
synced 2025-07-26 12:04:31 +00:00
1 line
5.2 MiB
1 line
5.2 MiB
[{"page_no": 0, "size": {"width": 612.0, "height": 792.0}, "cells": [{"index": 0, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 96.301, "r_y0": 119.93100000000004, "r_x1": 498.927, "r_y1": 119.93100000000004, "r_x2": 498.927, "r_y2": 107.03399999999999, "r_x3": 96.301, "r_y3": 107.03399999999999, "coord_origin": "TOPLEFT"}, "text": "TableFormer: Table Structure Understanding with Transformers.", "orig": "TableFormer: Table Structure Understanding with Transformers.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 142.477, "r_y0": 157.26999999999998, "r_x1": 452.75, "r_y1": 157.26999999999998, "r_x2": 452.75, "r_y2": 147.00800000000004, "r_x3": 142.477, "r_y3": 147.00800000000004, "coord_origin": "TOPLEFT"}, "text": "Ahmed Nassar, Nikolaos Livathinos, Maksym Lysak, Peter Staar", "orig": "Ahmed Nassar, Nikolaos Livathinos, Maksym Lysak, Peter Staar", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 262.918, "r_y0": 171.21699999999998, "r_x1": 332.306, "r_y1": 171.21699999999998, "r_x2": 332.306, "r_y2": 160.95500000000004, "r_x3": 262.918, "r_y3": 160.95500000000004, "coord_origin": "TOPLEFT"}, "text": "IBM Research", "orig": "IBM Research", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 208.123, "r_y0": 184.26999999999998, "r_x1": 212.731, "r_y1": 184.26999999999998, "r_x2": 212.731, "r_y2": 176.562, "r_x3": 208.123, "r_y3": 176.562, "coord_origin": "TOPLEFT"}, "text": "{", "orig": "{", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 212.73, "r_y0": 183.861, "r_x1": 378.733, "r_y1": 183.861, "r_x2": 378.733, "r_y2": 177.692, "r_x3": 212.73, "r_y3": 177.692, "coord_origin": "TOPLEFT"}, "text": "ahn,nli,mly,taa @zurich.ibm.com", "orig": "ahn,nli,mly,taa @zurich.ibm.com", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 293.428, "r_y0": 184.26999999999998, "r_x1": 298.036, "r_y1": 184.26999999999998, "r_x2": 298.036, "r_y2": 176.562, "r_x3": 293.428, "r_y3": 176.562, "coord_origin": "TOPLEFT"}, "text": "}", "orig": "}", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 145.995, "r_y0": 226.231, "r_x1": 190.48, "r_y1": 226.231, "r_x2": 190.48, "r_y2": 215.48299999999995, "r_x3": 145.995, "r_y3": 215.48299999999995, "coord_origin": "TOPLEFT"}, "text": "Abstract", "orig": "Abstract", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 249.98299999999995, "r_x1": 286.365, "r_y1": 249.98299999999995, "r_x2": 286.365, "r_y2": 241.39499999999998, "r_x3": 62.067, "r_y3": 241.39499999999998, "coord_origin": "TOPLEFT"}, "text": "Tables organize valuable content in a concise and com-", "orig": "Tables organize valuable content in a concise and com-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 261.938, "r_x1": 130.062, "r_y1": 261.938, "r_x2": 130.062, "r_y2": 253.35000000000002, "r_x3": 50.112, "r_y3": 253.35000000000002, "coord_origin": "TOPLEFT"}, "text": "pact representation.", "orig": "pact representation.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.475, "r_y0": 261.938, "r_x1": 286.365, "r_y1": 261.938, "r_x2": 286.365, "r_y2": 253.35000000000002, "r_x3": 134.475, "r_y3": 253.35000000000002, "coord_origin": "TOPLEFT"}, "text": "This content is extremely valuable for", "orig": "This content is extremely valuable for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 273.89300000000003, "r_x1": 286.365, "r_y1": 273.89300000000003, "r_x2": 286.365, "r_y2": 265.30499999999995, "r_x3": 50.112, "r_y3": 265.30499999999995, "coord_origin": "TOPLEFT"}, "text": "systems such as search engines, Knowledge Graph's, etc,", "orig": "systems such as search engines, Knowledge Graph's, etc,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 285.849, "r_x1": 245.18, "r_y1": 285.849, "r_x2": 245.18, "r_y2": 277.26099999999997, "r_x3": 50.112, "r_y3": 277.26099999999997, "coord_origin": "TOPLEFT"}, "text": "since they enhance their predictive capabilities.", "orig": "since they enhance their predictive capabilities.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 251.496, "r_y0": 285.849, "r_x1": 286.365, "r_y1": 285.849, "r_x2": 286.365, "r_y2": 277.26099999999997, "r_x3": 251.496, "r_y3": 277.26099999999997, "coord_origin": "TOPLEFT"}, "text": "Unfortu-", "orig": "Unfortu-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 297.804, "r_x1": 286.365, "r_y1": 297.804, "r_x2": 286.365, "r_y2": 289.216, "r_x3": 50.112, "r_y3": 289.216, "coord_origin": "TOPLEFT"}, "text": "nately, tables come in a large variety of shapes and sizes.", "orig": "nately, tables come in a large variety of shapes and sizes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 309.759, "r_x1": 103.601, "r_y1": 309.759, "r_x2": 103.601, "r_y2": 301.171, "r_x3": 50.112, "r_y3": 301.171, "coord_origin": "TOPLEFT"}, "text": "Furthermore,", "orig": "Furthermore,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 108.393, "r_y0": 309.759, "r_x1": 124.692, "r_y1": 309.759, "r_x2": 124.692, "r_y2": 301.171, "r_x3": 108.393, "r_y3": 301.171, "coord_origin": "TOPLEFT"}, "text": "they", "orig": "they", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 129.026, "r_y0": 309.759, "r_x1": 286.365, "r_y1": 309.759, "r_x2": 286.365, "r_y2": 301.171, "r_x3": 129.026, "r_y3": 301.171, "coord_origin": "TOPLEFT"}, "text": "can have complex column/row-header", "orig": "can have complex column/row-header", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 321.714, "r_x1": 286.365, "r_y1": 321.714, "r_x2": 286.365, "r_y2": 313.126, "r_x3": 50.112, "r_y3": 313.126, "coord_origin": "TOPLEFT"}, "text": "configurations, multiline rows, different variety of separa-", "orig": "configurations, multiline rows, different variety of separa-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 333.669, "r_x1": 175.123, "r_y1": 333.669, "r_x2": 175.123, "r_y2": 325.081, "r_x3": 50.112, "r_y3": 325.081, "coord_origin": "TOPLEFT"}, "text": "tion lines, missing entries, etc.", "orig": "tion lines, missing entries, etc.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 19, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 180.931, "r_y0": 333.669, "r_x1": 286.365, "r_y1": 333.669, "r_x2": 286.365, "r_y2": 325.081, "r_x3": 180.931, "r_y3": 325.081, "coord_origin": "TOPLEFT"}, "text": "As such, the correct iden-", "orig": "As such, the correct iden-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 20, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 345.624, "r_x1": 85.539, "r_y1": 345.624, "r_x2": 85.539, "r_y2": 337.036, "r_x3": 50.112, "r_y3": 337.036, "coord_origin": "TOPLEFT"}, "text": "tification", "orig": "tification", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 21, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 89.942, "r_y0": 345.624, "r_x1": 97.693, "r_y1": 345.624, "r_x2": 97.693, "r_y2": 337.036, "r_x3": 89.942, "r_y3": 337.036, "coord_origin": "TOPLEFT"}, "text": "of", "orig": "of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 22, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 102.107, "r_y0": 345.624, "r_x1": 114.281, "r_y1": 345.624, "r_x2": 114.281, "r_y2": 337.036, "r_x3": 102.107, "r_y3": 337.036, "coord_origin": "TOPLEFT"}, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 23, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 118.695, "r_y0": 345.624, "r_x1": 177.534, "r_y1": 345.624, "r_x2": 177.534, "r_y2": 337.036, "r_x3": 118.695, "r_y3": 337.036, "coord_origin": "TOPLEFT"}, "text": "table-structure", "orig": "table-structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 24, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 181.947, "r_y0": 345.624, "r_x1": 286.365, "r_y1": 345.624, "r_x2": 286.365, "r_y2": 337.036, "r_x3": 181.947, "r_y3": 337.036, "coord_origin": "TOPLEFT"}, "text": "from an image is a non-", "orig": "from an image is a non-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 25, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 357.58, "r_x1": 95.791, "r_y1": 357.58, "r_x2": 95.791, "r_y2": 348.992, "r_x3": 50.112, "r_y3": 348.992, "coord_origin": "TOPLEFT"}, "text": "trivial task.", "orig": "trivial task.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 26, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 99.746, "r_y0": 357.58, "r_x1": 286.365, "r_y1": 357.58, "r_x2": 286.365, "r_y2": 348.992, "r_x3": 99.746, "r_y3": 348.992, "coord_origin": "TOPLEFT"}, "text": "In this paper, we present a new table-structure", "orig": "In this paper, we present a new table-structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 27, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 369.535, "r_x1": 132.443, "r_y1": 369.535, "r_x2": 132.443, "r_y2": 360.947, "r_x3": 50.112, "r_y3": 360.947, "coord_origin": "TOPLEFT"}, "text": "identification model.", "orig": "identification model.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 28, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 136.777, "r_y0": 369.535, "r_x1": 286.365, "r_y1": 369.535, "r_x2": 286.365, "r_y2": 360.947, "r_x3": 136.777, "r_y3": 360.947, "coord_origin": "TOPLEFT"}, "text": "The latter improves the latest end-to-", "orig": "The latter improves the latest end-to-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 29, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 381.49, "r_x1": 170.4, "r_y1": 381.49, "r_x2": 170.4, "r_y2": 372.902, "r_x3": 50.112, "r_y3": 372.902, "coord_origin": "TOPLEFT"}, "text": "end deep learning model (i.e.", "orig": "end deep learning model (i.e.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 30, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 176.248, "r_y0": 381.49, "r_x1": 286.365, "r_y1": 381.49, "r_x2": 286.365, "r_y2": 372.902, "r_x3": 176.248, "r_y3": 372.902, "coord_origin": "TOPLEFT"}, "text": "encoder-dual-decoder from", "orig": "encoder-dual-decoder from", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 393.445, "r_x1": 196.572, "r_y1": 393.445, "r_x2": 196.572, "r_y2": 384.857, "r_x3": 50.112, "r_y3": 384.857, "coord_origin": "TOPLEFT"}, "text": "PubTabNet) in two significant ways.", "orig": "PubTabNet) in two significant ways.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 201.643, "r_y0": 393.445, "r_x1": 286.365, "r_y1": 393.445, "r_x2": 286.365, "r_y2": 384.857, "r_x3": 201.643, "r_y3": 384.857, "coord_origin": "TOPLEFT"}, "text": "First, we introduce a", "orig": "First, we introduce a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 405.4, "r_x1": 232.328, "r_y1": 405.4, "r_x2": 232.328, "r_y2": 396.812, "r_x3": 50.112, "r_y3": 396.812, "coord_origin": "TOPLEFT"}, "text": "new object detection decoder for table-cells.", "orig": "new object detection decoder for table-cells.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 238.584, "r_y0": 405.4, "r_x1": 286.365, "r_y1": 405.4, "r_x2": 286.365, "r_y2": 396.812, "r_x3": 238.584, "r_y3": 396.812, "coord_origin": "TOPLEFT"}, "text": "In this way,", "orig": "In this way,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 417.355, "r_x1": 286.365, "r_y1": 417.355, "r_x2": 286.365, "r_y2": 408.767, "r_x3": 50.112, "r_y3": 408.767, "coord_origin": "TOPLEFT"}, "text": "we can obtain the content of the table-cells from program-", "orig": "we can obtain the content of the table-cells from program-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 429.311, "r_x1": 286.365, "r_y1": 429.311, "r_x2": 286.365, "r_y2": 420.723, "r_x3": 50.112, "r_y3": 420.723, "coord_origin": "TOPLEFT"}, "text": "matic PDF's directly from the PDF source and avoid the", "orig": "matic PDF's directly from the PDF source and avoid the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 441.266, "r_x1": 207.232, "r_y1": 441.266, "r_x2": 207.232, "r_y2": 432.678, "r_x3": 50.112, "r_y3": 432.678, "coord_origin": "TOPLEFT"}, "text": "training of the custom OCR decoders.", "orig": "training of the custom OCR decoders.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 214.096, "r_y0": 441.266, "r_x1": 286.365, "r_y1": 441.266, "r_x2": 286.365, "r_y2": 432.678, "r_x3": 214.096, "r_y3": 432.678, "coord_origin": "TOPLEFT"}, "text": "This architectural", "orig": "This architectural", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 453.221, "r_x1": 286.365, "r_y1": 453.221, "r_x2": 286.365, "r_y2": 444.633, "r_x3": 50.112, "r_y3": 444.633, "coord_origin": "TOPLEFT"}, "text": "change leads to more accurate table-content extraction and", "orig": "change leads to more accurate table-content extraction and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 465.176, "r_x1": 204.233, "r_y1": 465.176, "r_x2": 204.233, "r_y2": 456.588, "r_x3": 50.112, "r_y3": 456.588, "coord_origin": "TOPLEFT"}, "text": "allows us to tackle non-english tables.", "orig": "allows us to tackle non-english tables.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 208.587, "r_y0": 465.176, "r_x1": 286.365, "r_y1": 465.176, "r_x2": 286.365, "r_y2": 456.588, "r_x3": 208.587, "r_y3": 456.588, "coord_origin": "TOPLEFT"}, "text": "Second, we replace", "orig": "Second, we replace", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 477.131, "r_x1": 286.365, "r_y1": 477.131, "r_x2": 286.365, "r_y2": 468.543, "r_x3": 50.112, "r_y3": 468.543, "coord_origin": "TOPLEFT"}, "text": "the LSTM decoders with transformer based decoders. This", "orig": "the LSTM decoders with transformer based decoders. This", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 489.087, "r_x1": 286.365, "r_y1": 489.087, "r_x2": 286.365, "r_y2": 480.499, "r_x3": 50.112, "r_y3": 480.499, "coord_origin": "TOPLEFT"}, "text": "upgrade improves significantly the previous state-of-the-art", "orig": "upgrade improves significantly the previous state-of-the-art", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 501.042, "r_x1": 286.365, "r_y1": 501.042, "r_x2": 286.365, "r_y2": 492.454, "r_x3": 50.112, "r_y3": 492.454, "coord_origin": "TOPLEFT"}, "text": "tree-editing-distance-score (TEDS) from 91% to 98.5% on", "orig": "tree-editing-distance-score (TEDS) from 91% to 98.5% on", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 512.9970000000001, "r_x1": 276.652, "r_y1": 512.9970000000001, "r_x2": 276.652, "r_y2": 504.409, "r_x3": 50.112, "r_y3": 504.409, "coord_origin": "TOPLEFT"}, "text": "simple tables and from 88.7% to 95% on complex tables.", "orig": "simple tables and from 88.7% to 95% on complex tables.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 550.691, "r_x1": 126.948, "r_y1": 550.691, "r_x2": 126.948, "r_y2": 539.943, "r_x3": 50.112, "r_y3": 539.943, "coord_origin": "TOPLEFT"}, "text": "1. Introduction", "orig": "1. Introduction", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 569.604, "r_x1": 166.266, "r_y1": 569.604, "r_x2": 166.266, "r_y2": 561.052, "r_x3": 62.067, "r_y3": 561.052, "coord_origin": "TOPLEFT"}, "text": "The occurrence of tables", "orig": "The occurrence of tables", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 48, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 170.759, "r_y0": 569.604, "r_x1": 178.51, "r_y1": 569.604, "r_x2": 178.51, "r_y2": 561.052, "r_x3": 170.759, "r_y3": 561.052, "coord_origin": "TOPLEFT"}, "text": "in", "orig": "in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 49, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.003, "r_y0": 569.604, "r_x1": 286.365, "r_y1": 569.604, "r_x2": 286.365, "r_y2": 561.052, "r_x3": 183.003, "r_y3": 561.052, "coord_origin": "TOPLEFT"}, "text": "documents is ubiquitous.", "orig": "documents is ubiquitous.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 50, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 581.559, "r_x1": 286.365, "r_y1": 581.559, "r_x2": 286.365, "r_y2": 573.0070000000001, "r_x3": 50.112, "r_y3": 573.0070000000001, "coord_origin": "TOPLEFT"}, "text": "They often summarise quantitative or factual data, which is", "orig": "They often summarise quantitative or factual data, which is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 51, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 593.514, "r_x1": 286.365, "r_y1": 593.514, "r_x2": 286.365, "r_y2": 584.962, "r_x3": 50.112, "r_y3": 584.962, "coord_origin": "TOPLEFT"}, "text": "cumbersome to describe in verbose text but nevertheless ex-", "orig": "cumbersome to describe in verbose text but nevertheless ex-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 52, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 605.47, "r_x1": 119.95, "r_y1": 605.47, "r_x2": 119.95, "r_y2": 596.918, "r_x3": 50.112, "r_y3": 596.918, "coord_origin": "TOPLEFT"}, "text": "tremely valuable.", "orig": "tremely valuable.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 53, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 125.778, "r_y0": 605.47, "r_x1": 286.365, "r_y1": 605.47, "r_x2": 286.365, "r_y2": 596.918, "r_x3": 125.778, "r_y3": 596.918, "coord_origin": "TOPLEFT"}, "text": "Unfortunately, this compact representa-", "orig": "Unfortunately, this compact representa-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 54, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 617.425, "r_x1": 286.365, "r_y1": 617.425, "r_x2": 286.365, "r_y2": 608.873, "r_x3": 50.112, "r_y3": 608.873, "coord_origin": "TOPLEFT"}, "text": "tion is often not easy to parse by machines. There are many", "orig": "tion is often not easy to parse by machines. There are many", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 55, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 629.38, "r_x1": 286.365, "r_y1": 629.38, "r_x2": 286.365, "r_y2": 620.828, "r_x3": 50.112, "r_y3": 620.828, "coord_origin": "TOPLEFT"}, "text": "implicit conventions used to obtain a compact table repre-", "orig": "implicit conventions used to obtain a compact table repre-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 56, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 641.335, "r_x1": 286.365, "r_y1": 641.335, "r_x2": 286.365, "r_y2": 632.783, "r_x3": 50.112, "r_y3": 632.783, "coord_origin": "TOPLEFT"}, "text": "sentation. For example, tables often have complex column-", "orig": "sentation. For example, tables often have complex column-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 57, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 653.29, "r_x1": 286.365, "r_y1": 653.29, "r_x2": 286.365, "r_y2": 644.738, "r_x3": 50.112, "r_y3": 644.738, "coord_origin": "TOPLEFT"}, "text": "and row-headers in order to reduce duplicated cell content.", "orig": "and row-headers in order to reduce duplicated cell content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 58, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 665.245, "r_x1": 286.365, "r_y1": 665.245, "r_x2": 286.365, "r_y2": 656.693, "r_x3": 50.112, "r_y3": 656.693, "coord_origin": "TOPLEFT"}, "text": "Lines of different shapes and sizes are leveraged to separate", "orig": "Lines of different shapes and sizes are leveraged to separate", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 59, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 677.201, "r_x1": 286.365, "r_y1": 677.201, "r_x2": 286.365, "r_y2": 668.649, "r_x3": 50.112, "r_y3": 668.649, "coord_origin": "TOPLEFT"}, "text": "content or indicate a tree structure. Additionally, tables can", "orig": "content or indicate a tree structure. Additionally, tables can", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 60, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 689.156, "r_x1": 286.365, "r_y1": 689.156, "r_x2": 286.365, "r_y2": 680.604, "r_x3": 50.112, "r_y3": 680.604, "coord_origin": "TOPLEFT"}, "text": "also have empty/missing table-entries or multi-row textual", "orig": "also have empty/missing table-entries or multi-row textual", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 61, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 701.111, "r_x1": 101.848, "r_y1": 701.111, "r_x2": 101.848, "r_y2": 692.559, "r_x3": 50.112, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "table-entries.", "orig": "table-entries.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 62, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 106.261, "r_y0": 701.111, "r_x1": 286.365, "r_y1": 701.111, "r_x2": 286.365, "r_y2": 692.559, "r_x3": 106.261, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "Fig. 1 shows a table which presents all these", "orig": "Fig. 1 shows a table which presents all these", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 63, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 713.066, "r_x1": 76.403, "r_y1": 713.066, "r_x2": 76.403, "r_y2": 704.514, "r_x3": 50.112, "r_y3": 704.514, "coord_origin": "TOPLEFT"}, "text": "issues.", "orig": "issues.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 64, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 315.567, "r_y0": 226.66200000000003, "r_x1": 408.441, "r_y1": 226.66200000000003, "r_x2": 408.441, "r_y2": 218.34900000000005, "r_x3": 315.567, "r_y3": 218.34900000000005, "coord_origin": "TOPLEFT"}, "text": "a. Picture of a table:", "orig": "a. Picture of a table:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 65, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 315.567, "r_y0": 322.35, "r_x1": 486.402, "r_y1": 322.35, "r_x2": 486.402, "r_y2": 314.037, "r_x3": 315.567, "r_y3": 314.037, "coord_origin": "TOPLEFT"}, "text": "b. Red-annotation of bounding boxes,", "orig": "b. Red-annotation of bounding boxes,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 66, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 326.463, "r_y0": 333.15, "r_x1": 472.474, "r_y1": 333.15, "r_x2": 472.474, "r_y2": 324.837, "r_x3": 326.463, "r_y3": 324.837, "coord_origin": "TOPLEFT"}, "text": "Blue-predictions by TableFormer", "orig": "Blue-predictions by TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 67, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 315.567, "r_y0": 428.838, "r_x1": 491.191, "r_y1": 428.838, "r_x2": 491.191, "r_y2": 420.525, "r_x3": 315.567, "r_y3": 420.525, "coord_origin": "TOPLEFT"}, "text": "c. Structure predicted by TableFormer:", "orig": "c. Structure predicted by TableFormer:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 68, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 408.148, "r_y0": 351.356, "r_x1": 412.54, "r_y1": 351.356, "r_x2": 412.54, "r_y2": 343.601, "r_x3": 408.148, "r_y3": 343.601, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 69, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 356.11, "r_y0": 350.099, "r_x1": 360.503, "r_y1": 350.099, "r_x2": 360.503, "r_y2": 342.345, "r_x3": 356.11, "r_y3": 342.345, "coord_origin": "TOPLEFT"}, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 70, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 500.678, "r_y0": 349.465, "r_x1": 505.07, "r_y1": 349.465, "r_x2": 505.07, "r_y2": 341.711, "r_x3": 500.678, "r_y3": 341.711, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 71, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 356.134, "r_y0": 360.275, "r_x1": 360.526, "r_y1": 360.275, "r_x2": 360.526, "r_y2": 352.521, "r_x3": 356.134, "r_y3": 352.521, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 72, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 402.54, "r_y0": 364.404, "r_x1": 406.932, "r_y1": 364.404, "r_x2": 406.932, "r_y2": 356.65, "r_x3": 402.54, "r_y3": 356.65, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 73, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 448.582, "r_y0": 361.367, "r_x1": 452.974, "r_y1": 361.367, "r_x2": 452.974, "r_y2": 353.613, "r_x3": 448.582, "r_y3": 353.613, "coord_origin": "TOPLEFT"}, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 74, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 491.652, "r_y0": 362.234, "r_x1": 496.044, "r_y1": 362.234, "r_x2": 496.044, "r_y2": 354.48, "r_x3": 491.652, "r_y3": 354.48, "coord_origin": "TOPLEFT"}, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 75, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 535.138, "r_y0": 361.867, "r_x1": 539.531, "r_y1": 361.867, "r_x2": 539.531, "r_y2": 354.113, "r_x3": 535.138, "r_y3": 354.113, "coord_origin": "TOPLEFT"}, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 76, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 348.828, "r_y0": 395.625, "r_x1": 353.221, "r_y1": 395.625, "r_x2": 353.221, "r_y2": 387.871, "r_x3": 348.828, "r_y3": 387.871, "coord_origin": "TOPLEFT"}, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 77, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 389.272, "r_y0": 383.9, "r_x1": 393.664, "r_y1": 383.9, "r_x2": 393.664, "r_y2": 376.145, "r_x3": 389.272, "r_y3": 376.145, "coord_origin": "TOPLEFT"}, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 78, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 442.675, "r_y0": 384.173, "r_x1": 451.459, "r_y1": 384.173, "r_x2": 451.459, "r_y2": 376.419, "r_x3": 442.675, "r_y3": 376.419, "coord_origin": "TOPLEFT"}, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 79, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 477.438, "r_y0": 384.061, "r_x1": 485.902, "r_y1": 384.061, "r_x2": 485.902, "r_y2": 376.307, "r_x3": 477.438, "r_y3": 376.307, "coord_origin": "TOPLEFT"}, "text": "11", "orig": "11", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 80, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 522.573, "r_y0": 384.173, "r_x1": 531.357, "r_y1": 384.173, "r_x2": 531.357, "r_y2": 376.419, "r_x3": 522.573, "r_y3": 376.419, "coord_origin": "TOPLEFT"}, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 81, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 400.23, "r_y0": 395.642, "r_x1": 409.014, "r_y1": 395.642, "r_x2": 409.014, "r_y2": 387.887, "r_x3": 400.23, "r_y3": 387.887, "coord_origin": "TOPLEFT"}, "text": "13", "orig": "13", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 82, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 442.308, "r_y0": 395.517, "r_x1": 451.092, "r_y1": 395.517, "r_x2": 451.092, "r_y2": 387.763, "r_x3": 442.308, "r_y3": 387.763, "coord_origin": "TOPLEFT"}, "text": "14", "orig": "14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 83, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 478.219, "r_y0": 395.902, "r_x1": 487.003, "r_y1": 395.902, "r_x2": 487.003, "r_y2": 388.148, "r_x3": 478.219, "r_y3": 388.148, "coord_origin": "TOPLEFT"}, "text": "15", "orig": "15", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 84, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 523.229, "r_y0": 395.517, "r_x1": 532.013, "r_y1": 395.517, "r_x2": 532.013, "r_y2": 387.763, "r_x3": 523.229, "r_y3": 387.763, "coord_origin": "TOPLEFT"}, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 85, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 411.572, "r_y0": 407.952, "r_x1": 420.356, "r_y1": 407.952, "r_x2": 420.356, "r_y2": 400.198, "r_x3": 411.572, "r_y3": 400.198, "coord_origin": "TOPLEFT"}, "text": "17", "orig": "17", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 86, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 442.305, "r_y0": 407.564, "r_x1": 451.089, "r_y1": 407.564, "r_x2": 451.089, "r_y2": 399.81, "r_x3": 442.305, "r_y3": 399.81, "coord_origin": "TOPLEFT"}, "text": "18", "orig": "18", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 87, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 478.779, "r_y0": 407.524, "r_x1": 487.563, "r_y1": 407.524, "r_x2": 487.563, "r_y2": 399.769, "r_x3": 478.779, "r_y3": 399.769, "coord_origin": "TOPLEFT"}, "text": "19", "orig": "19", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 88, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 523.972, "r_y0": 407.139, "r_x1": 532.756, "r_y1": 407.139, "r_x2": 532.756, "r_y2": 399.385, "r_x3": 523.972, "r_y3": 399.385, "coord_origin": "TOPLEFT"}, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 89, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 347.249, "r_y0": 446.213, "r_x1": 351.641, "r_y1": 446.213, "r_x2": 351.641, "r_y2": 438.459, "r_x3": 347.249, "r_y3": 438.459, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 90, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 318.881, "r_y0": 446.213, "r_x1": 323.273, "r_y1": 446.213, "r_x2": 323.273, "r_y2": 438.459, "r_x3": 318.881, "r_y3": 438.459, "coord_origin": "TOPLEFT"}, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 91, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.104, "r_y0": 446.213, "r_x1": 398.497, "r_y1": 446.213, "r_x2": 398.497, "r_y2": 438.459, "r_x3": 394.104, "r_y3": 438.459, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 92, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 318.773, "r_y0": 458.073, "r_x1": 323.166, "r_y1": 458.073, "r_x2": 323.166, "r_y2": 450.319, "r_x3": 318.773, "r_y3": 450.319, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 93, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 347.249, "r_y0": 458.073, "r_x1": 351.641, "r_y1": 458.073, "r_x2": 351.641, "r_y2": 450.319, "r_x3": 347.249, "r_y3": 450.319, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 94, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.104, "r_y0": 458.073, "r_x1": 398.497, "r_y1": 458.073, "r_x2": 398.497, "r_y2": 450.319, "r_x3": 394.104, "r_y3": 450.319, "coord_origin": "TOPLEFT"}, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 95, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 440.959, "r_y0": 458.073, "r_x1": 445.352, "r_y1": 458.073, "r_x2": 445.352, "r_y2": 450.319, "r_x3": 440.959, "r_y3": 450.319, "coord_origin": "TOPLEFT"}, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 96, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 487.815, "r_y0": 458.073, "r_x1": 492.207, "r_y1": 458.073, "r_x2": 492.207, "r_y2": 450.319, "r_x3": 487.815, "r_y3": 450.319, "coord_origin": "TOPLEFT"}, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 97, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 318.773, "r_y0": 482.232, "r_x1": 323.166, "r_y1": 482.232, "r_x2": 323.166, "r_y2": 474.477, "r_x3": 318.773, "r_y3": 474.477, "coord_origin": "TOPLEFT"}, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 98, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 347.249, "r_y0": 470.372, "r_x1": 351.641, "r_y1": 470.372, "r_x2": 351.641, "r_y2": 462.618, "r_x3": 347.249, "r_y3": 462.618, "coord_origin": "TOPLEFT"}, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 99, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.104, "r_y0": 470.372, "r_x1": 402.888, "r_y1": 470.372, "r_x2": 402.888, "r_y2": 462.618, "r_x3": 394.104, "r_y3": 462.618, "coord_origin": "TOPLEFT"}, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 100, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 440.959, "r_y0": 470.372, "r_x1": 449.423, "r_y1": 470.372, "r_x2": 449.423, "r_y2": 462.618, "r_x3": 440.959, "r_y3": 462.618, "coord_origin": "TOPLEFT"}, "text": "11", "orig": "11", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 101, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 487.815, "r_y0": 470.372, "r_x1": 496.599, "r_y1": 470.372, "r_x2": 496.599, "r_y2": 462.618, "r_x3": 487.815, "r_y3": 462.618, "coord_origin": "TOPLEFT"}, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 102, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 347.249, "r_y0": 482.232, "r_x1": 356.033, "r_y1": 482.232, "r_x2": 356.033, "r_y2": 474.477, "r_x3": 347.249, "r_y3": 474.477, "coord_origin": "TOPLEFT"}, "text": "13", "orig": "13", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 103, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.104, "r_y0": 482.232, "r_x1": 402.888, "r_y1": 482.232, "r_x2": 402.888, "r_y2": 474.477, "r_x3": 394.104, "r_y3": 474.477, "coord_origin": "TOPLEFT"}, "text": "14", "orig": "14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 104, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 440.959, "r_y0": 482.232, "r_x1": 449.743, "r_y1": 482.232, "r_x2": 449.743, "r_y2": 474.477, "r_x3": 440.959, "r_y3": 474.477, "coord_origin": "TOPLEFT"}, "text": "15", "orig": "15", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 105, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 487.815, "r_y0": 482.232, "r_x1": 496.599, "r_y1": 482.232, "r_x2": 496.599, "r_y2": 474.477, "r_x3": 487.815, "r_y3": 474.477, "coord_origin": "TOPLEFT"}, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 106, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 347.249, "r_y0": 493.652, "r_x1": 356.033, "r_y1": 493.652, "r_x2": 356.033, "r_y2": 485.898, "r_x3": 347.249, "r_y3": 485.898, "coord_origin": "TOPLEFT"}, "text": "17", "orig": "17", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 107, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.104, "r_y0": 493.652, "r_x1": 402.888, "r_y1": 493.652, "r_x2": 402.888, "r_y2": 485.898, "r_x3": 394.104, "r_y3": 485.898, "coord_origin": "TOPLEFT"}, "text": "18", "orig": "18", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 108, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 440.959, "r_y0": 493.652, "r_x1": 449.743, "r_y1": 493.652, "r_x2": 449.743, "r_y2": 485.898, "r_x3": 440.959, "r_y3": 485.898, "coord_origin": "TOPLEFT"}, "text": "19", "orig": "19", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 109, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 487.815, "r_y0": 493.652, "r_x1": 496.599, "r_y1": 493.652, "r_x2": 496.599, "r_y2": 485.898, "r_x3": 487.815, "r_y3": 485.898, "coord_origin": "TOPLEFT"}, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 110, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 451.946, "r_y0": 245.44000000000005, "r_x1": 457.951, "r_y1": 245.44000000000005, "r_x2": 457.951, "r_y2": 235.47699999999998, "r_x3": 451.946, "r_y3": 235.47699999999998, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 111, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 385.094, "r_y0": 367.853, "r_x1": 391.099, "r_y1": 367.853, "r_x2": 391.099, "r_y2": 357.89, "r_x3": 385.094, "r_y3": 357.89, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 112, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 366.701, "r_y0": 459.214, "r_x1": 372.706, "r_y1": 459.214, "r_x2": 372.706, "r_y2": 449.25, "r_x3": 366.701, "r_y3": 449.25, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 113, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 331.197, "r_y0": 279.446, "r_x1": 337.202, "r_y1": 279.446, "r_x2": 337.202, "r_y2": 269.48199999999997, "r_x3": 331.197, "r_y3": 269.48199999999997, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 114, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 333.435, "r_y0": 390.82, "r_x1": 339.439, "r_y1": 390.82, "r_x2": 339.439, "r_y2": 380.856, "r_x3": 333.435, "r_y3": 380.856, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 115, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 331.904, "r_y0": 483.416, "r_x1": 337.909, "r_y1": 483.416, "r_x2": 337.909, "r_y2": 473.452, "r_x3": 331.904, "r_y3": 473.452, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 116, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 478.072, "r_y0": 351.13, "r_x1": 484.077, "r_y1": 351.13, "r_x2": 484.077, "r_y2": 341.166, "r_x3": 478.072, "r_y3": 341.166, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 117, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 459.876, "r_y0": 447.687, "r_x1": 465.881, "r_y1": 447.687, "r_x2": 465.881, "r_y2": 437.723, "r_x3": 459.876, "r_y3": 437.723, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 118, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 384.033, "r_y0": 262.77200000000005, "r_x1": 390.038, "r_y1": 262.77200000000005, "r_x2": 390.038, "r_y2": 252.80899999999997, "r_x3": 384.033, "r_y3": 252.80899999999997, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 119, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 523.321, "r_x1": 345.734, "r_y1": 523.321, "r_x2": 345.734, "r_y2": 514.769, "r_x3": 308.862, "r_y3": 514.769, "coord_origin": "TOPLEFT"}, "text": "Figure 1:", "orig": "Figure 1:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 120, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 353.176, "r_y0": 523.321, "r_x1": 545.115, "r_y1": 523.321, "r_x2": 545.115, "r_y2": 514.769, "r_x3": 353.176, "r_y3": 514.769, "coord_origin": "TOPLEFT"}, "text": "Picture of a table with subtle, complex features", "orig": "Picture of a table with subtle, complex features", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 121, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 535.2760000000001, "r_x1": 545.115, "r_y1": 535.2760000000001, "r_x2": 545.115, "r_y2": 526.7239999999999, "r_x3": 308.862, "r_y3": 526.7239999999999, "coord_origin": "TOPLEFT"}, "text": "such as (1) multi-column headers, (2) cell with multi-row", "orig": "such as (1) multi-column headers, (2) cell with multi-row", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 122, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 547.231, "r_x1": 445.539, "r_y1": 547.231, "r_x2": 445.539, "r_y2": 538.679, "r_x3": 308.862, "r_y3": 538.679, "coord_origin": "TOPLEFT"}, "text": "text and (3) cells with no content.", "orig": "text and (3) cells with no content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 123, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 450.221, "r_y0": 547.231, "r_x1": 545.115, "r_y1": 547.231, "r_x2": 545.115, "r_y2": 538.679, "r_x3": 450.221, "r_y3": 538.679, "coord_origin": "TOPLEFT"}, "text": "Image from PubTabNet", "orig": "Image from PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 124, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 559.187, "r_x1": 505.692, "r_y1": 559.187, "r_x2": 505.692, "r_y2": 550.635, "r_x3": 308.862, "r_y3": 550.635, "coord_origin": "TOPLEFT"}, "text": "evaluation set, filename: 'PMC2944238 004 02'.", "orig": "evaluation set, filename: 'PMC2944238 004 02'.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 125, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 593.23, "r_x1": 358.077, "r_y1": 593.23, "r_x2": 358.077, "r_y2": 584.678, "r_x3": 320.817, "r_y3": 584.678, "coord_origin": "TOPLEFT"}, "text": "Recently,", "orig": "Recently,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 126, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 362.62, "r_y0": 593.23, "r_x1": 404.134, "r_y1": 593.23, "r_x2": 404.134, "r_y2": 584.678, "r_x3": 362.62, "r_y3": 584.678, "coord_origin": "TOPLEFT"}, "text": "significant", "orig": "significant", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 127, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 408.259, "r_y0": 593.23, "r_x1": 545.115, "r_y1": 593.23, "r_x2": 545.115, "r_y2": 584.678, "r_x3": 408.259, "r_y3": 584.678, "coord_origin": "TOPLEFT"}, "text": "progress has been made with vi-", "orig": "progress has been made with vi-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 128, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 605.185, "r_x1": 526.365, "r_y1": 605.185, "r_x2": 526.365, "r_y2": 596.633, "r_x3": 308.862, "r_y3": 596.633, "coord_origin": "TOPLEFT"}, "text": "sion based approaches to extract tables in documents.", "orig": "sion based approaches to extract tables in documents.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 129, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 531.426, "r_y0": 605.185, "r_x1": 545.115, "r_y1": 605.185, "r_x2": 545.115, "r_y2": 596.633, "r_x3": 531.426, "r_y3": 596.633, "coord_origin": "TOPLEFT"}, "text": "For", "orig": "For", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 130, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 617.14, "r_x1": 545.115, "r_y1": 617.14, "r_x2": 545.115, "r_y2": 608.588, "r_x3": 308.862, "r_y3": 608.588, "coord_origin": "TOPLEFT"}, "text": "the sake of completeness, the issue of table extraction from", "orig": "the sake of completeness, the issue of table extraction from", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 131, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 629.095, "r_x1": 545.115, "r_y1": 629.095, "r_x2": 545.115, "r_y2": 620.543, "r_x3": 308.862, "r_y3": 620.543, "coord_origin": "TOPLEFT"}, "text": "documents is typically decomposed into two separate chal-", "orig": "documents is typically decomposed into two separate chal-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 132, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 641.0509999999999, "r_x1": 336.807, "r_y1": 641.0509999999999, "r_x2": 336.807, "r_y2": 632.499, "r_x3": 308.862, "r_y3": 632.499, "coord_origin": "TOPLEFT"}, "text": "lenges,", "orig": "lenges,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 133, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 341.519, "r_y0": 641.0509999999999, "r_x1": 353.694, "r_y1": 641.0509999999999, "r_x2": 353.694, "r_y2": 632.499, "r_x3": 341.519, "r_y3": 632.499, "coord_origin": "TOPLEFT"}, "text": "i.e.", "orig": "i.e.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 134, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 362.112, "r_y0": 641.0509999999999, "r_x1": 373.728, "r_y1": 641.0509999999999, "r_x2": 373.728, "r_y2": 632.499, "r_x3": 362.112, "r_y3": 632.499, "coord_origin": "TOPLEFT"}, "text": "(1)", "orig": "(1)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 135, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 377.992, "r_y0": 641.0509999999999, "r_x1": 406.226, "r_y1": 641.0509999999999, "r_x2": 406.226, "r_y2": 632.499, "r_x3": 377.992, "r_y3": 632.499, "coord_origin": "TOPLEFT"}, "text": "finding", "orig": "finding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 136, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 410.5, "r_y0": 641.0509999999999, "r_x1": 422.675, "r_y1": 641.0509999999999, "r_x2": 422.675, "r_y2": 632.499, "r_x3": 410.5, "r_y3": 632.499, "coord_origin": "TOPLEFT"}, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 137, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 426.939, "r_y0": 641.0509999999999, "r_x1": 459.038, "r_y1": 641.0509999999999, "r_x2": 459.038, "r_y2": 632.499, "r_x3": 426.939, "r_y3": 632.499, "coord_origin": "TOPLEFT"}, "text": "location", "orig": "location", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 138, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 463.302, "r_y0": 641.0509999999999, "r_x1": 471.601, "r_y1": 641.0509999999999, "r_x2": 471.601, "r_y2": 632.499, "r_x3": 463.302, "r_y3": 632.499, "coord_origin": "TOPLEFT"}, "text": "of", "orig": "of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 139, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 475.875, "r_y0": 641.0509999999999, "r_x1": 488.049, "r_y1": 641.0509999999999, "r_x2": 488.049, "r_y2": 632.499, "r_x3": 475.875, "r_y3": 632.499, "coord_origin": "TOPLEFT"}, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 140, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 492.313, "r_y0": 641.0509999999999, "r_x1": 522.191, "r_y1": 641.0509999999999, "r_x2": 522.191, "r_y2": 632.499, "r_x3": 492.313, "r_y3": 632.499, "coord_origin": "TOPLEFT"}, "text": "table(s)", "orig": "table(s)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 141, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 526.455, "r_y0": 641.0509999999999, "r_x1": 545.115, "r_y1": 641.0509999999999, "r_x2": 545.115, "r_y2": 632.499, "r_x3": 526.455, "r_y3": 632.499, "coord_origin": "TOPLEFT"}, "text": "on a", "orig": "on a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 142, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 653.006, "r_x1": 545.115, "r_y1": 653.006, "r_x2": 545.115, "r_y2": 644.454, "r_x3": 308.862, "r_y3": 644.454, "coord_origin": "TOPLEFT"}, "text": "document-page and (2) finding the structure of a given table", "orig": "document-page and (2) finding the structure of a given table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 143, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 664.961, "r_x1": 375.552, "r_y1": 664.961, "r_x2": 375.552, "r_y2": 656.409, "r_x3": 308.862, "r_y3": 656.409, "coord_origin": "TOPLEFT"}, "text": "in the document.", "orig": "in the document.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 144, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 677.201, "r_x1": 545.115, "r_y1": 677.201, "r_x2": 545.115, "r_y2": 668.649, "r_x3": 320.817, "r_y3": 668.649, "coord_origin": "TOPLEFT"}, "text": "The first problem is called table-location and has been", "orig": "The first problem is called table-location and has been", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 145, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 689.156, "r_x1": 545.115, "r_y1": 689.156, "r_x2": 545.115, "r_y2": 680.604, "r_x3": 308.862, "r_y3": 680.604, "coord_origin": "TOPLEFT"}, "text": "previously addressed [30, 38, 19, 21, 23, 26, 8] with state-", "orig": "previously addressed [30, 38, 19, 21, 23, 26, 8] with state-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 146, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 701.111, "r_x1": 474.261, "r_y1": 701.111, "r_x2": 474.261, "r_y2": 692.559, "r_x3": 308.862, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "of-the-art object-detection networks (e.g.", "orig": "of-the-art object-detection networks (e.g.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 147, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 479.342, "r_y0": 701.111, "r_x1": 545.115, "r_y1": 701.111, "r_x2": 545.115, "r_y2": 692.559, "r_x3": 479.342, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "YOLO and later", "orig": "YOLO and later", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 148, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 713.066, "r_x1": 395.796, "r_y1": 713.066, "r_x2": 395.796, "r_y2": 704.514, "r_x3": 308.862, "r_y3": 704.514, "coord_origin": "TOPLEFT"}, "text": "on Mask-RCNN [9]).", "orig": "on Mask-RCNN [9]).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 149, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 401.046, "r_y0": 713.066, "r_x1": 545.115, "r_y1": 713.066, "r_x2": 545.115, "r_y2": 704.514, "r_x3": 401.046, "r_y3": 704.514, "coord_origin": "TOPLEFT"}, "text": "For all practical purposes, it can be", "orig": "For all practical purposes, it can be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 150, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 295.121, "r_y0": 742.954, "r_x1": 300.102, "r_y1": 742.954, "r_x2": 300.102, "r_y2": 734.402, "r_x3": 295.121, "r_y3": 734.402, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 151, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 36.34, "r_y0": 560.0, "r_x1": 36.34, "r_y1": 380.0, "r_x2": 18.34, "r_y2": 380.0, "r_x3": 18.34, "r_y3": 560.0, "coord_origin": "TOPLEFT"}, "text": "arXiv:2203.01017v2", "orig": "arXiv:2203.01017v2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 152, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 36.34, "r_y0": 360.0, "r_x1": 36.34, "r_y1": 290.0, "r_x2": 18.34, "r_y2": 290.0, "r_x3": 18.34, "r_y3": 360.0, "coord_origin": "TOPLEFT"}, "text": "[cs.CV]", "orig": "[cs.CV]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 153, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 36.34, "r_y0": 270.0, "r_x1": 36.34, "r_y1": 250.0, "r_x2": 18.34, "r_y2": 250.0, "r_x3": 18.34, "r_y3": 270.0, "coord_origin": "TOPLEFT"}, "text": "11", "orig": "11", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 154, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 36.34, "r_y0": 240.0, "r_x1": 36.34, "r_y1": 210.0, "r_x2": 18.34, "r_y2": 210.0, "r_x3": 18.34, "r_y3": 240.0, "coord_origin": "TOPLEFT"}, "text": "Mar", "orig": "Mar", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 155, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 36.34, "r_y0": 200.0, "r_x1": 36.34, "r_y1": 160.0, "r_x2": 18.34, "r_y2": 160.0, "r_x3": 18.34, "r_y3": 200.0, "coord_origin": "TOPLEFT"}, "text": "2022", "orig": "2022", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "parsed_page": null, "predictions": {"layout": {"clusters": [{"id": 8, "label": "section_header", "bbox": {"l": 96.301, "t": 107.03399999999999, "r": 498.927, "b": 119.93100000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.8868067860603333, "cells": [{"index": 0, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 96.301, "r_y0": 119.93100000000004, "r_x1": 498.927, "r_y1": 119.93100000000004, "r_x2": 498.927, "r_y2": 107.03399999999999, "r_x3": 96.301, "r_y3": 107.03399999999999, "coord_origin": "TOPLEFT"}, "text": "TableFormer: Table Structure Understanding with Transformers.", "orig": "TableFormer: Table Structure Understanding with Transformers.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 13, "label": "section_header", "bbox": {"l": 142.477, "t": 147.00800000000004, "r": 452.75, "b": 171.21699999999998, "coord_origin": "TOPLEFT"}, "confidence": 0.7586215734481812, "cells": [{"index": 1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 142.477, "r_y0": 157.26999999999998, "r_x1": 452.75, "r_y1": 157.26999999999998, "r_x2": 452.75, "r_y2": 147.00800000000004, "r_x3": 142.477, "r_y3": 147.00800000000004, "coord_origin": "TOPLEFT"}, "text": "Ahmed Nassar, Nikolaos Livathinos, Maksym Lysak, Peter Staar", "orig": "Ahmed Nassar, Nikolaos Livathinos, Maksym Lysak, Peter Staar", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 262.918, "r_y0": 171.21699999999998, "r_x1": 332.306, "r_y1": 171.21699999999998, "r_x2": 332.306, "r_y2": 160.95500000000004, "r_x3": 262.918, "r_y3": 160.95500000000004, "coord_origin": "TOPLEFT"}, "text": "IBM Research", "orig": "IBM Research", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 25, "label": "key_value_region", "bbox": {"l": 208.123, "t": 176.562, "r": 378.733, "b": 184.26999999999998, "coord_origin": "TOPLEFT"}, "confidence": 0.4854728579521179, "cells": [{"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 208.123, "r_y0": 184.26999999999998, "r_x1": 212.731, "r_y1": 184.26999999999998, "r_x2": 212.731, "r_y2": 176.562, "r_x3": 208.123, "r_y3": 176.562, "coord_origin": "TOPLEFT"}, "text": "{", "orig": "{", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 212.73, "r_y0": 183.861, "r_x1": 378.733, "r_y1": 183.861, "r_x2": 378.733, "r_y2": 177.692, "r_x3": 212.73, "r_y3": 177.692, "coord_origin": "TOPLEFT"}, "text": "ahn,nli,mly,taa @zurich.ibm.com", "orig": "ahn,nli,mly,taa @zurich.ibm.com", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 293.428, "r_y0": 184.26999999999998, "r_x1": 298.036, "r_y1": 184.26999999999998, "r_x2": 298.036, "r_y2": 176.562, "r_x3": 293.428, "r_y3": 176.562, "coord_origin": "TOPLEFT"}, "text": "}", "orig": "}", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": [{"id": 7, "label": "text", "bbox": {"l": 208.123, "t": 176.562, "r": 378.733, "b": 184.26999999999998, "coord_origin": "TOPLEFT"}, "confidence": 0.9096331596374512, "cells": [{"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 208.123, "r_y0": 184.26999999999998, "r_x1": 212.731, "r_y1": 184.26999999999998, "r_x2": 212.731, "r_y2": 176.562, "r_x3": 208.123, "r_y3": 176.562, "coord_origin": "TOPLEFT"}, "text": "{", "orig": "{", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 212.73, "r_y0": 183.861, "r_x1": 378.733, "r_y1": 183.861, "r_x2": 378.733, "r_y2": 177.692, "r_x3": 212.73, "r_y3": 177.692, "coord_origin": "TOPLEFT"}, "text": "ahn,nli,mly,taa @zurich.ibm.com", "orig": "ahn,nli,mly,taa @zurich.ibm.com", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 293.428, "r_y0": 184.26999999999998, "r_x1": 298.036, "r_y1": 184.26999999999998, "r_x2": 298.036, "r_y2": 176.562, "r_x3": 293.428, "r_y3": 176.562, "coord_origin": "TOPLEFT"}, "text": "}", "orig": "}", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}]}, {"id": 5, "label": "section_header", "bbox": {"l": 145.995, "t": 215.48299999999995, "r": 190.48, "b": 226.231, "coord_origin": "TOPLEFT"}, "confidence": 0.9258671402931213, "cells": [{"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 145.995, "r_y0": 226.231, "r_x1": 190.48, "r_y1": 226.231, "r_x2": 190.48, "r_y2": 215.48299999999995, "r_x3": 145.995, "r_y3": 215.48299999999995, "coord_origin": "TOPLEFT"}, "text": "Abstract", "orig": "Abstract", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 2, "label": "text", "bbox": {"l": 50.112, "t": 241.39499999999998, "r": 286.365, "b": 512.9970000000001, "coord_origin": "TOPLEFT"}, "confidence": 0.9838882088661194, "cells": [{"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 249.98299999999995, "r_x1": 286.365, "r_y1": 249.98299999999995, "r_x2": 286.365, "r_y2": 241.39499999999998, "r_x3": 62.067, "r_y3": 241.39499999999998, "coord_origin": "TOPLEFT"}, "text": "Tables organize valuable content in a concise and com-", "orig": "Tables organize valuable content in a concise and com-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 261.938, "r_x1": 130.062, "r_y1": 261.938, "r_x2": 130.062, "r_y2": 253.35000000000002, "r_x3": 50.112, "r_y3": 253.35000000000002, "coord_origin": "TOPLEFT"}, "text": "pact representation.", "orig": "pact representation.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.475, "r_y0": 261.938, "r_x1": 286.365, "r_y1": 261.938, "r_x2": 286.365, "r_y2": 253.35000000000002, "r_x3": 134.475, "r_y3": 253.35000000000002, "coord_origin": "TOPLEFT"}, "text": "This content is extremely valuable for", "orig": "This content is extremely valuable for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 273.89300000000003, "r_x1": 286.365, "r_y1": 273.89300000000003, "r_x2": 286.365, "r_y2": 265.30499999999995, "r_x3": 50.112, "r_y3": 265.30499999999995, "coord_origin": "TOPLEFT"}, "text": "systems such as search engines, Knowledge Graph's, etc,", "orig": "systems such as search engines, Knowledge Graph's, etc,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 285.849, "r_x1": 245.18, "r_y1": 285.849, "r_x2": 245.18, "r_y2": 277.26099999999997, "r_x3": 50.112, "r_y3": 277.26099999999997, "coord_origin": "TOPLEFT"}, "text": "since they enhance their predictive capabilities.", "orig": "since they enhance their predictive capabilities.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 251.496, "r_y0": 285.849, "r_x1": 286.365, "r_y1": 285.849, "r_x2": 286.365, "r_y2": 277.26099999999997, "r_x3": 251.496, "r_y3": 277.26099999999997, "coord_origin": "TOPLEFT"}, "text": "Unfortu-", "orig": "Unfortu-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 297.804, "r_x1": 286.365, "r_y1": 297.804, "r_x2": 286.365, "r_y2": 289.216, "r_x3": 50.112, "r_y3": 289.216, "coord_origin": "TOPLEFT"}, "text": "nately, tables come in a large variety of shapes and sizes.", "orig": "nately, tables come in a large variety of shapes and sizes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 309.759, "r_x1": 103.601, "r_y1": 309.759, "r_x2": 103.601, "r_y2": 301.171, "r_x3": 50.112, "r_y3": 301.171, "coord_origin": "TOPLEFT"}, "text": "Furthermore,", "orig": "Furthermore,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 108.393, "r_y0": 309.759, "r_x1": 124.692, "r_y1": 309.759, "r_x2": 124.692, "r_y2": 301.171, "r_x3": 108.393, "r_y3": 301.171, "coord_origin": "TOPLEFT"}, "text": "they", "orig": "they", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 129.026, "r_y0": 309.759, "r_x1": 286.365, "r_y1": 309.759, "r_x2": 286.365, "r_y2": 301.171, "r_x3": 129.026, "r_y3": 301.171, "coord_origin": "TOPLEFT"}, "text": "can have complex column/row-header", "orig": "can have complex column/row-header", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 321.714, "r_x1": 286.365, "r_y1": 321.714, "r_x2": 286.365, "r_y2": 313.126, "r_x3": 50.112, "r_y3": 313.126, "coord_origin": "TOPLEFT"}, "text": "configurations, multiline rows, different variety of separa-", "orig": "configurations, multiline rows, different variety of separa-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 333.669, "r_x1": 175.123, "r_y1": 333.669, "r_x2": 175.123, "r_y2": 325.081, "r_x3": 50.112, "r_y3": 325.081, "coord_origin": "TOPLEFT"}, "text": "tion lines, missing entries, etc.", "orig": "tion lines, missing entries, etc.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 19, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 180.931, "r_y0": 333.669, "r_x1": 286.365, "r_y1": 333.669, "r_x2": 286.365, "r_y2": 325.081, "r_x3": 180.931, "r_y3": 325.081, "coord_origin": "TOPLEFT"}, "text": "As such, the correct iden-", "orig": "As such, the correct iden-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 20, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 345.624, "r_x1": 85.539, "r_y1": 345.624, "r_x2": 85.539, "r_y2": 337.036, "r_x3": 50.112, "r_y3": 337.036, "coord_origin": "TOPLEFT"}, "text": "tification", "orig": "tification", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 21, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 89.942, "r_y0": 345.624, "r_x1": 97.693, "r_y1": 345.624, "r_x2": 97.693, "r_y2": 337.036, "r_x3": 89.942, "r_y3": 337.036, "coord_origin": "TOPLEFT"}, "text": "of", "orig": "of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 22, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 102.107, "r_y0": 345.624, "r_x1": 114.281, "r_y1": 345.624, "r_x2": 114.281, "r_y2": 337.036, "r_x3": 102.107, "r_y3": 337.036, "coord_origin": "TOPLEFT"}, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 23, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 118.695, "r_y0": 345.624, "r_x1": 177.534, "r_y1": 345.624, "r_x2": 177.534, "r_y2": 337.036, "r_x3": 118.695, "r_y3": 337.036, "coord_origin": "TOPLEFT"}, "text": "table-structure", "orig": "table-structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 24, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 181.947, "r_y0": 345.624, "r_x1": 286.365, "r_y1": 345.624, "r_x2": 286.365, "r_y2": 337.036, "r_x3": 181.947, "r_y3": 337.036, "coord_origin": "TOPLEFT"}, "text": "from an image is a non-", "orig": "from an image is a non-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 25, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 357.58, "r_x1": 95.791, "r_y1": 357.58, "r_x2": 95.791, "r_y2": 348.992, "r_x3": 50.112, "r_y3": 348.992, "coord_origin": "TOPLEFT"}, "text": "trivial task.", "orig": "trivial task.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 26, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 99.746, "r_y0": 357.58, "r_x1": 286.365, "r_y1": 357.58, "r_x2": 286.365, "r_y2": 348.992, "r_x3": 99.746, "r_y3": 348.992, "coord_origin": "TOPLEFT"}, "text": "In this paper, we present a new table-structure", "orig": "In this paper, we present a new table-structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 27, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 369.535, "r_x1": 132.443, "r_y1": 369.535, "r_x2": 132.443, "r_y2": 360.947, "r_x3": 50.112, "r_y3": 360.947, "coord_origin": "TOPLEFT"}, "text": "identification model.", "orig": "identification model.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 28, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 136.777, "r_y0": 369.535, "r_x1": 286.365, "r_y1": 369.535, "r_x2": 286.365, "r_y2": 360.947, "r_x3": 136.777, "r_y3": 360.947, "coord_origin": "TOPLEFT"}, "text": "The latter improves the latest end-to-", "orig": "The latter improves the latest end-to-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 29, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 381.49, "r_x1": 170.4, "r_y1": 381.49, "r_x2": 170.4, "r_y2": 372.902, "r_x3": 50.112, "r_y3": 372.902, "coord_origin": "TOPLEFT"}, "text": "end deep learning model (i.e.", "orig": "end deep learning model (i.e.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 30, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 176.248, "r_y0": 381.49, "r_x1": 286.365, "r_y1": 381.49, "r_x2": 286.365, "r_y2": 372.902, "r_x3": 176.248, "r_y3": 372.902, "coord_origin": "TOPLEFT"}, "text": "encoder-dual-decoder from", "orig": "encoder-dual-decoder from", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 393.445, "r_x1": 196.572, "r_y1": 393.445, "r_x2": 196.572, "r_y2": 384.857, "r_x3": 50.112, "r_y3": 384.857, "coord_origin": "TOPLEFT"}, "text": "PubTabNet) in two significant ways.", "orig": "PubTabNet) in two significant ways.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 201.643, "r_y0": 393.445, "r_x1": 286.365, "r_y1": 393.445, "r_x2": 286.365, "r_y2": 384.857, "r_x3": 201.643, "r_y3": 384.857, "coord_origin": "TOPLEFT"}, "text": "First, we introduce a", "orig": "First, we introduce a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 405.4, "r_x1": 232.328, "r_y1": 405.4, "r_x2": 232.328, "r_y2": 396.812, "r_x3": 50.112, "r_y3": 396.812, "coord_origin": "TOPLEFT"}, "text": "new object detection decoder for table-cells.", "orig": "new object detection decoder for table-cells.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 238.584, "r_y0": 405.4, "r_x1": 286.365, "r_y1": 405.4, "r_x2": 286.365, "r_y2": 396.812, "r_x3": 238.584, "r_y3": 396.812, "coord_origin": "TOPLEFT"}, "text": "In this way,", "orig": "In this way,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 417.355, "r_x1": 286.365, "r_y1": 417.355, "r_x2": 286.365, "r_y2": 408.767, "r_x3": 50.112, "r_y3": 408.767, "coord_origin": "TOPLEFT"}, "text": "we can obtain the content of the table-cells from program-", "orig": "we can obtain the content of the table-cells from program-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 429.311, "r_x1": 286.365, "r_y1": 429.311, "r_x2": 286.365, "r_y2": 420.723, "r_x3": 50.112, "r_y3": 420.723, "coord_origin": "TOPLEFT"}, "text": "matic PDF's directly from the PDF source and avoid the", "orig": "matic PDF's directly from the PDF source and avoid the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 441.266, "r_x1": 207.232, "r_y1": 441.266, "r_x2": 207.232, "r_y2": 432.678, "r_x3": 50.112, "r_y3": 432.678, "coord_origin": "TOPLEFT"}, "text": "training of the custom OCR decoders.", "orig": "training of the custom OCR decoders.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 214.096, "r_y0": 441.266, "r_x1": 286.365, "r_y1": 441.266, "r_x2": 286.365, "r_y2": 432.678, "r_x3": 214.096, "r_y3": 432.678, "coord_origin": "TOPLEFT"}, "text": "This architectural", "orig": "This architectural", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 453.221, "r_x1": 286.365, "r_y1": 453.221, "r_x2": 286.365, "r_y2": 444.633, "r_x3": 50.112, "r_y3": 444.633, "coord_origin": "TOPLEFT"}, "text": "change leads to more accurate table-content extraction and", "orig": "change leads to more accurate table-content extraction and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 465.176, "r_x1": 204.233, "r_y1": 465.176, "r_x2": 204.233, "r_y2": 456.588, "r_x3": 50.112, "r_y3": 456.588, "coord_origin": "TOPLEFT"}, "text": "allows us to tackle non-english tables.", "orig": "allows us to tackle non-english tables.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 208.587, "r_y0": 465.176, "r_x1": 286.365, "r_y1": 465.176, "r_x2": 286.365, "r_y2": 456.588, "r_x3": 208.587, "r_y3": 456.588, "coord_origin": "TOPLEFT"}, "text": "Second, we replace", "orig": "Second, we replace", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 477.131, "r_x1": 286.365, "r_y1": 477.131, "r_x2": 286.365, "r_y2": 468.543, "r_x3": 50.112, "r_y3": 468.543, "coord_origin": "TOPLEFT"}, "text": "the LSTM decoders with transformer based decoders. This", "orig": "the LSTM decoders with transformer based decoders. This", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 489.087, "r_x1": 286.365, "r_y1": 489.087, "r_x2": 286.365, "r_y2": 480.499, "r_x3": 50.112, "r_y3": 480.499, "coord_origin": "TOPLEFT"}, "text": "upgrade improves significantly the previous state-of-the-art", "orig": "upgrade improves significantly the previous state-of-the-art", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 501.042, "r_x1": 286.365, "r_y1": 501.042, "r_x2": 286.365, "r_y2": 492.454, "r_x3": 50.112, "r_y3": 492.454, "coord_origin": "TOPLEFT"}, "text": "tree-editing-distance-score (TEDS) from 91% to 98.5% on", "orig": "tree-editing-distance-score (TEDS) from 91% to 98.5% on", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 512.9970000000001, "r_x1": 276.652, "r_y1": 512.9970000000001, "r_x2": 276.652, "r_y2": 504.409, "r_x3": 50.112, "r_y3": 504.409, "coord_origin": "TOPLEFT"}, "text": "simple tables and from 88.7% to 95% on complex tables.", "orig": "simple tables and from 88.7% to 95% on complex tables.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 4, "label": "section_header", "bbox": {"l": 50.112, "t": 539.943, "r": 126.948, "b": 550.691, "coord_origin": "TOPLEFT"}, "confidence": 0.9317677617073059, "cells": [{"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 550.691, "r_x1": 126.948, "r_y1": 550.691, "r_x2": 126.948, "r_y2": 539.943, "r_x3": 50.112, "r_y3": 539.943, "coord_origin": "TOPLEFT"}, "text": "1. Introduction", "orig": "1. Introduction", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 1, "label": "text", "bbox": {"l": 50.112, "t": 561.052, "r": 286.365, "b": 713.066, "coord_origin": "TOPLEFT"}, "confidence": 0.9841895699501038, "cells": [{"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 569.604, "r_x1": 166.266, "r_y1": 569.604, "r_x2": 166.266, "r_y2": 561.052, "r_x3": 62.067, "r_y3": 561.052, "coord_origin": "TOPLEFT"}, "text": "The occurrence of tables", "orig": "The occurrence of tables", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 48, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 170.759, "r_y0": 569.604, "r_x1": 178.51, "r_y1": 569.604, "r_x2": 178.51, "r_y2": 561.052, "r_x3": 170.759, "r_y3": 561.052, "coord_origin": "TOPLEFT"}, "text": "in", "orig": "in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 49, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.003, "r_y0": 569.604, "r_x1": 286.365, "r_y1": 569.604, "r_x2": 286.365, "r_y2": 561.052, "r_x3": 183.003, "r_y3": 561.052, "coord_origin": "TOPLEFT"}, "text": "documents is ubiquitous.", "orig": "documents is ubiquitous.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 50, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 581.559, "r_x1": 286.365, "r_y1": 581.559, "r_x2": 286.365, "r_y2": 573.0070000000001, "r_x3": 50.112, "r_y3": 573.0070000000001, "coord_origin": "TOPLEFT"}, "text": "They often summarise quantitative or factual data, which is", "orig": "They often summarise quantitative or factual data, which is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 51, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 593.514, "r_x1": 286.365, "r_y1": 593.514, "r_x2": 286.365, "r_y2": 584.962, "r_x3": 50.112, "r_y3": 584.962, "coord_origin": "TOPLEFT"}, "text": "cumbersome to describe in verbose text but nevertheless ex-", "orig": "cumbersome to describe in verbose text but nevertheless ex-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 52, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 605.47, "r_x1": 119.95, "r_y1": 605.47, "r_x2": 119.95, "r_y2": 596.918, "r_x3": 50.112, "r_y3": 596.918, "coord_origin": "TOPLEFT"}, "text": "tremely valuable.", "orig": "tremely valuable.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 53, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 125.778, "r_y0": 605.47, "r_x1": 286.365, "r_y1": 605.47, "r_x2": 286.365, "r_y2": 596.918, "r_x3": 125.778, "r_y3": 596.918, "coord_origin": "TOPLEFT"}, "text": "Unfortunately, this compact representa-", "orig": "Unfortunately, this compact representa-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 54, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 617.425, "r_x1": 286.365, "r_y1": 617.425, "r_x2": 286.365, "r_y2": 608.873, "r_x3": 50.112, "r_y3": 608.873, "coord_origin": "TOPLEFT"}, "text": "tion is often not easy to parse by machines. There are many", "orig": "tion is often not easy to parse by machines. There are many", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 55, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 629.38, "r_x1": 286.365, "r_y1": 629.38, "r_x2": 286.365, "r_y2": 620.828, "r_x3": 50.112, "r_y3": 620.828, "coord_origin": "TOPLEFT"}, "text": "implicit conventions used to obtain a compact table repre-", "orig": "implicit conventions used to obtain a compact table repre-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 56, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 641.335, "r_x1": 286.365, "r_y1": 641.335, "r_x2": 286.365, "r_y2": 632.783, "r_x3": 50.112, "r_y3": 632.783, "coord_origin": "TOPLEFT"}, "text": "sentation. For example, tables often have complex column-", "orig": "sentation. For example, tables often have complex column-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 57, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 653.29, "r_x1": 286.365, "r_y1": 653.29, "r_x2": 286.365, "r_y2": 644.738, "r_x3": 50.112, "r_y3": 644.738, "coord_origin": "TOPLEFT"}, "text": "and row-headers in order to reduce duplicated cell content.", "orig": "and row-headers in order to reduce duplicated cell content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 58, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 665.245, "r_x1": 286.365, "r_y1": 665.245, "r_x2": 286.365, "r_y2": 656.693, "r_x3": 50.112, "r_y3": 656.693, "coord_origin": "TOPLEFT"}, "text": "Lines of different shapes and sizes are leveraged to separate", "orig": "Lines of different shapes and sizes are leveraged to separate", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 59, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 677.201, "r_x1": 286.365, "r_y1": 677.201, "r_x2": 286.365, "r_y2": 668.649, "r_x3": 50.112, "r_y3": 668.649, "coord_origin": "TOPLEFT"}, "text": "content or indicate a tree structure. Additionally, tables can", "orig": "content or indicate a tree structure. Additionally, tables can", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 60, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 689.156, "r_x1": 286.365, "r_y1": 689.156, "r_x2": 286.365, "r_y2": 680.604, "r_x3": 50.112, "r_y3": 680.604, "coord_origin": "TOPLEFT"}, "text": "also have empty/missing table-entries or multi-row textual", "orig": "also have empty/missing table-entries or multi-row textual", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 61, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 701.111, "r_x1": 101.848, "r_y1": 701.111, "r_x2": 101.848, "r_y2": 692.559, "r_x3": 50.112, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "table-entries.", "orig": "table-entries.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 62, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 106.261, "r_y0": 701.111, "r_x1": 286.365, "r_y1": 701.111, "r_x2": 286.365, "r_y2": 692.559, "r_x3": 106.261, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "Fig. 1 shows a table which presents all these", "orig": "Fig. 1 shows a table which presents all these", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 63, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 713.066, "r_x1": 76.403, "r_y1": 713.066, "r_x2": 76.403, "r_y2": 704.514, "r_x3": 50.112, "r_y3": 704.514, "coord_origin": "TOPLEFT"}, "text": "issues.", "orig": "issues.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 14, "label": "section_header", "bbox": {"l": 315.567, "t": 218.34900000000005, "r": 408.441, "b": 226.66200000000003, "coord_origin": "TOPLEFT"}, "confidence": 0.6724023818969727, "cells": [{"index": 64, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 315.567, "r_y0": 226.66200000000003, "r_x1": 408.441, "r_y1": 226.66200000000003, "r_x2": 408.441, "r_y2": 218.34900000000005, "r_x3": 315.567, "r_y3": 218.34900000000005, "coord_origin": "TOPLEFT"}, "text": "a. Picture of a table:", "orig": "a. Picture of a table:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 17, "label": "list_item", "bbox": {"l": 315.567, "t": 314.037, "r": 486.402, "b": 333.15, "coord_origin": "TOPLEFT"}, "confidence": 0.5549328923225403, "cells": [{"index": 65, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 315.567, "r_y0": 322.35, "r_x1": 486.402, "r_y1": 322.35, "r_x2": 486.402, "r_y2": 314.037, "r_x3": 315.567, "r_y3": 314.037, "coord_origin": "TOPLEFT"}, "text": "b. Red-annotation of bounding boxes,", "orig": "b. Red-annotation of bounding boxes,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 66, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 326.463, "r_y0": 333.15, "r_x1": 472.474, "r_y1": 333.15, "r_x2": 472.474, "r_y2": 324.837, "r_x3": 326.463, "r_y3": 324.837, "coord_origin": "TOPLEFT"}, "text": "Blue-predictions by TableFormer", "orig": "Blue-predictions by TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 18, "label": "list_item", "bbox": {"l": 315.567, "t": 420.525, "r": 491.191, "b": 428.838, "coord_origin": "TOPLEFT"}, "confidence": 0.5501358509063721, "cells": [{"index": 67, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 315.567, "r_y0": 428.838, "r_x1": 491.191, "r_y1": 428.838, "r_x2": 491.191, "r_y2": 420.525, "r_x3": 315.567, "r_y3": 420.525, "coord_origin": "TOPLEFT"}, "text": "c. Structure predicted by TableFormer:", "orig": "c. Structure predicted by TableFormer:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 10, "label": "picture", "bbox": {"l": 314.78173828125, "t": 338.0652770996094, "r": 539.1802978515625, "b": 410.0494384765625, "coord_origin": "TOPLEFT"}, "confidence": 0.8742761611938477, "cells": [{"index": 68, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 408.148, "r_y0": 351.356, "r_x1": 412.54, "r_y1": 351.356, "r_x2": 412.54, "r_y2": 343.601, "r_x3": 408.148, "r_y3": 343.601, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 69, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 356.11, "r_y0": 350.099, "r_x1": 360.503, "r_y1": 350.099, "r_x2": 360.503, "r_y2": 342.345, "r_x3": 356.11, "r_y3": 342.345, "coord_origin": "TOPLEFT"}, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 70, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 500.678, "r_y0": 349.465, "r_x1": 505.07, "r_y1": 349.465, "r_x2": 505.07, "r_y2": 341.711, "r_x3": 500.678, "r_y3": 341.711, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 71, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 356.134, "r_y0": 360.275, "r_x1": 360.526, "r_y1": 360.275, "r_x2": 360.526, "r_y2": 352.521, "r_x3": 356.134, "r_y3": 352.521, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 72, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 402.54, "r_y0": 364.404, "r_x1": 406.932, "r_y1": 364.404, "r_x2": 406.932, "r_y2": 356.65, "r_x3": 402.54, "r_y3": 356.65, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 73, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 448.582, "r_y0": 361.367, "r_x1": 452.974, "r_y1": 361.367, "r_x2": 452.974, "r_y2": 353.613, "r_x3": 448.582, "r_y3": 353.613, "coord_origin": "TOPLEFT"}, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 74, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 491.652, "r_y0": 362.234, "r_x1": 496.044, "r_y1": 362.234, "r_x2": 496.044, "r_y2": 354.48, "r_x3": 491.652, "r_y3": 354.48, "coord_origin": "TOPLEFT"}, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 75, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 535.138, "r_y0": 361.867, "r_x1": 539.531, "r_y1": 361.867, "r_x2": 539.531, "r_y2": 354.113, "r_x3": 535.138, "r_y3": 354.113, "coord_origin": "TOPLEFT"}, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 76, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 348.828, "r_y0": 395.625, "r_x1": 353.221, "r_y1": 395.625, "r_x2": 353.221, "r_y2": 387.871, "r_x3": 348.828, "r_y3": 387.871, "coord_origin": "TOPLEFT"}, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 77, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 389.272, "r_y0": 383.9, "r_x1": 393.664, "r_y1": 383.9, "r_x2": 393.664, "r_y2": 376.145, "r_x3": 389.272, "r_y3": 376.145, "coord_origin": "TOPLEFT"}, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 78, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 442.675, "r_y0": 384.173, "r_x1": 451.459, "r_y1": 384.173, "r_x2": 451.459, "r_y2": 376.419, "r_x3": 442.675, "r_y3": 376.419, "coord_origin": "TOPLEFT"}, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 79, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 477.438, "r_y0": 384.061, "r_x1": 485.902, "r_y1": 384.061, "r_x2": 485.902, "r_y2": 376.307, "r_x3": 477.438, "r_y3": 376.307, "coord_origin": "TOPLEFT"}, "text": "11", "orig": "11", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 80, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 522.573, "r_y0": 384.173, "r_x1": 531.357, "r_y1": 384.173, "r_x2": 531.357, "r_y2": 376.419, "r_x3": 522.573, "r_y3": 376.419, "coord_origin": "TOPLEFT"}, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 81, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 400.23, "r_y0": 395.642, "r_x1": 409.014, "r_y1": 395.642, "r_x2": 409.014, "r_y2": 387.887, "r_x3": 400.23, "r_y3": 387.887, "coord_origin": "TOPLEFT"}, "text": "13", "orig": "13", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 82, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 442.308, "r_y0": 395.517, "r_x1": 451.092, "r_y1": 395.517, "r_x2": 451.092, "r_y2": 387.763, "r_x3": 442.308, "r_y3": 387.763, "coord_origin": "TOPLEFT"}, "text": "14", "orig": "14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 83, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 478.219, "r_y0": 395.902, "r_x1": 487.003, "r_y1": 395.902, "r_x2": 487.003, "r_y2": 388.148, "r_x3": 478.219, "r_y3": 388.148, "coord_origin": "TOPLEFT"}, "text": "15", "orig": "15", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 84, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 523.229, "r_y0": 395.517, "r_x1": 532.013, "r_y1": 395.517, "r_x2": 532.013, "r_y2": 387.763, "r_x3": 523.229, "r_y3": 387.763, "coord_origin": "TOPLEFT"}, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 85, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 411.572, "r_y0": 407.952, "r_x1": 420.356, "r_y1": 407.952, "r_x2": 420.356, "r_y2": 400.198, "r_x3": 411.572, "r_y3": 400.198, "coord_origin": "TOPLEFT"}, "text": "17", "orig": "17", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 86, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 442.305, "r_y0": 407.564, "r_x1": 451.089, "r_y1": 407.564, "r_x2": 451.089, "r_y2": 399.81, "r_x3": 442.305, "r_y3": 399.81, "coord_origin": "TOPLEFT"}, "text": "18", "orig": "18", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 87, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 478.779, "r_y0": 407.524, "r_x1": 487.563, "r_y1": 407.524, "r_x2": 487.563, "r_y2": 399.769, "r_x3": 478.779, "r_y3": 399.769, "coord_origin": "TOPLEFT"}, "text": "19", "orig": "19", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 88, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 523.972, "r_y0": 407.139, "r_x1": 532.756, "r_y1": 407.139, "r_x2": 532.756, "r_y2": 399.385, "r_x3": 523.972, "r_y3": 399.385, "coord_origin": "TOPLEFT"}, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 111, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 385.094, "r_y0": 367.853, "r_x1": 391.099, "r_y1": 367.853, "r_x2": 391.099, "r_y2": 357.89, "r_x3": 385.094, "r_y3": 357.89, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 114, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 333.435, "r_y0": 390.82, "r_x1": 339.439, "r_y1": 390.82, "r_x2": 339.439, "r_y2": 380.856, "r_x3": 333.435, "r_y3": 380.856, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 116, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 478.072, "r_y0": 351.13, "r_x1": 484.077, "r_y1": 351.13, "r_x2": 484.077, "r_y2": 341.166, "r_x3": 478.072, "r_y3": 341.166, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": [{"id": 40, "label": "text", "bbox": {"l": 408.148, "t": 343.601, "r": 412.54, "b": 351.356, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 68, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 408.148, "r_y0": 351.356, "r_x1": 412.54, "r_y1": 351.356, "r_x2": 412.54, "r_y2": 343.601, "r_x3": 408.148, "r_y3": 343.601, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 41, "label": "text", "bbox": {"l": 356.11, "t": 342.345, "r": 360.503, "b": 350.099, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 69, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 356.11, "r_y0": 350.099, "r_x1": 360.503, "r_y1": 350.099, "r_x2": 360.503, "r_y2": 342.345, "r_x3": 356.11, "r_y3": 342.345, "coord_origin": "TOPLEFT"}, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 42, "label": "text", "bbox": {"l": 500.678, "t": 341.711, "r": 505.07, "b": 349.465, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 70, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 500.678, "r_y0": 349.465, "r_x1": 505.07, "r_y1": 349.465, "r_x2": 505.07, "r_y2": 341.711, "r_x3": 500.678, "r_y3": 341.711, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 43, "label": "text", "bbox": {"l": 356.134, "t": 352.521, "r": 360.526, "b": 360.275, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 71, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 356.134, "r_y0": 360.275, "r_x1": 360.526, "r_y1": 360.275, "r_x2": 360.526, "r_y2": 352.521, "r_x3": 356.134, "r_y3": 352.521, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 44, "label": "text", "bbox": {"l": 402.54, "t": 356.65, "r": 406.932, "b": 364.404, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 72, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 402.54, "r_y0": 364.404, "r_x1": 406.932, "r_y1": 364.404, "r_x2": 406.932, "r_y2": 356.65, "r_x3": 402.54, "r_y3": 356.65, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 45, "label": "text", "bbox": {"l": 448.582, "t": 353.613, "r": 452.974, "b": 361.367, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 73, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 448.582, "r_y0": 361.367, "r_x1": 452.974, "r_y1": 361.367, "r_x2": 452.974, "r_y2": 353.613, "r_x3": 448.582, "r_y3": 353.613, "coord_origin": "TOPLEFT"}, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 46, "label": "text", "bbox": {"l": 491.652, "t": 354.48, "r": 496.044, "b": 362.234, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 74, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 491.652, "r_y0": 362.234, "r_x1": 496.044, "r_y1": 362.234, "r_x2": 496.044, "r_y2": 354.48, "r_x3": 491.652, "r_y3": 354.48, "coord_origin": "TOPLEFT"}, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 47, "label": "text", "bbox": {"l": 535.138, "t": 354.113, "r": 539.531, "b": 361.867, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 75, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 535.138, "r_y0": 361.867, "r_x1": 539.531, "r_y1": 361.867, "r_x2": 539.531, "r_y2": 354.113, "r_x3": 535.138, "r_y3": 354.113, "coord_origin": "TOPLEFT"}, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 48, "label": "text", "bbox": {"l": 348.828, "t": 387.871, "r": 353.221, "b": 395.625, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 76, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 348.828, "r_y0": 395.625, "r_x1": 353.221, "r_y1": 395.625, "r_x2": 353.221, "r_y2": 387.871, "r_x3": 348.828, "r_y3": 387.871, "coord_origin": "TOPLEFT"}, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 49, "label": "text", "bbox": {"l": 389.272, "t": 376.145, "r": 393.664, "b": 383.9, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 77, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 389.272, "r_y0": 383.9, "r_x1": 393.664, "r_y1": 383.9, "r_x2": 393.664, "r_y2": 376.145, "r_x3": 389.272, "r_y3": 376.145, "coord_origin": "TOPLEFT"}, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 50, "label": "text", "bbox": {"l": 442.675, "t": 376.419, "r": 451.459, "b": 384.173, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 78, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 442.675, "r_y0": 384.173, "r_x1": 451.459, "r_y1": 384.173, "r_x2": 451.459, "r_y2": 376.419, "r_x3": 442.675, "r_y3": 376.419, "coord_origin": "TOPLEFT"}, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 51, "label": "text", "bbox": {"l": 477.438, "t": 376.307, "r": 485.902, "b": 384.061, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 79, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 477.438, "r_y0": 384.061, "r_x1": 485.902, "r_y1": 384.061, "r_x2": 485.902, "r_y2": 376.307, "r_x3": 477.438, "r_y3": 376.307, "coord_origin": "TOPLEFT"}, "text": "11", "orig": "11", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 52, "label": "text", "bbox": {"l": 522.573, "t": 376.419, "r": 531.357, "b": 384.173, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 80, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 522.573, "r_y0": 384.173, "r_x1": 531.357, "r_y1": 384.173, "r_x2": 531.357, "r_y2": 376.419, "r_x3": 522.573, "r_y3": 376.419, "coord_origin": "TOPLEFT"}, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 53, "label": "text", "bbox": {"l": 400.23, "t": 387.887, "r": 409.014, "b": 395.642, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 81, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 400.23, "r_y0": 395.642, "r_x1": 409.014, "r_y1": 395.642, "r_x2": 409.014, "r_y2": 387.887, "r_x3": 400.23, "r_y3": 387.887, "coord_origin": "TOPLEFT"}, "text": "13", "orig": "13", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 54, "label": "text", "bbox": {"l": 442.308, "t": 387.763, "r": 451.092, "b": 395.517, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 82, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 442.308, "r_y0": 395.517, "r_x1": 451.092, "r_y1": 395.517, "r_x2": 451.092, "r_y2": 387.763, "r_x3": 442.308, "r_y3": 387.763, "coord_origin": "TOPLEFT"}, "text": "14", "orig": "14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 55, "label": "text", "bbox": {"l": 478.219, "t": 388.148, "r": 487.003, "b": 395.902, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 83, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 478.219, "r_y0": 395.902, "r_x1": 487.003, "r_y1": 395.902, "r_x2": 487.003, "r_y2": 388.148, "r_x3": 478.219, "r_y3": 388.148, "coord_origin": "TOPLEFT"}, "text": "15", "orig": "15", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 56, "label": "text", "bbox": {"l": 523.229, "t": 387.763, "r": 532.013, "b": 395.517, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 84, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 523.229, "r_y0": 395.517, "r_x1": 532.013, "r_y1": 395.517, "r_x2": 532.013, "r_y2": 387.763, "r_x3": 523.229, "r_y3": 387.763, "coord_origin": "TOPLEFT"}, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 57, "label": "text", "bbox": {"l": 411.572, "t": 400.198, "r": 420.356, "b": 407.952, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 85, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 411.572, "r_y0": 407.952, "r_x1": 420.356, "r_y1": 407.952, "r_x2": 420.356, "r_y2": 400.198, "r_x3": 411.572, "r_y3": 400.198, "coord_origin": "TOPLEFT"}, "text": "17", "orig": "17", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 58, "label": "text", "bbox": {"l": 442.305, "t": 399.81, "r": 451.089, "b": 407.564, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 86, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 442.305, "r_y0": 407.564, "r_x1": 451.089, "r_y1": 407.564, "r_x2": 451.089, "r_y2": 399.81, "r_x3": 442.305, "r_y3": 399.81, "coord_origin": "TOPLEFT"}, "text": "18", "orig": "18", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 59, "label": "text", "bbox": {"l": 478.779, "t": 399.769, "r": 487.563, "b": 407.524, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 87, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 478.779, "r_y0": 407.524, "r_x1": 487.563, "r_y1": 407.524, "r_x2": 487.563, "r_y2": 399.769, "r_x3": 478.779, "r_y3": 399.769, "coord_origin": "TOPLEFT"}, "text": "19", "orig": "19", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 60, "label": "text", "bbox": {"l": 523.972, "t": 399.385, "r": 532.756, "b": 407.139, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 88, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 523.972, "r_y0": 407.139, "r_x1": 532.756, "r_y1": 407.139, "r_x2": 532.756, "r_y2": 399.385, "r_x3": 523.972, "r_y3": 399.385, "coord_origin": "TOPLEFT"}, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 83, "label": "text", "bbox": {"l": 385.094, "t": 357.89, "r": 391.099, "b": 367.853, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 111, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 385.094, "r_y0": 367.853, "r_x1": 391.099, "r_y1": 367.853, "r_x2": 391.099, "r_y2": 357.89, "r_x3": 385.094, "r_y3": 357.89, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 86, "label": "text", "bbox": {"l": 333.435, "t": 380.856, "r": 339.439, "b": 390.82, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 114, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 333.435, "r_y0": 390.82, "r_x1": 339.439, "r_y1": 390.82, "r_x2": 339.439, "r_y2": 380.856, "r_x3": 333.435, "r_y3": 380.856, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 88, "label": "text", "bbox": {"l": 478.072, "t": 341.166, "r": 484.077, "b": 351.13, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 116, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 478.072, "r_y0": 351.13, "r_x1": 484.077, "r_y1": 351.13, "r_x2": 484.077, "r_y2": 341.166, "r_x3": 478.072, "r_y3": 341.166, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}]}, {"id": 23, "label": "picture", "bbox": {"l": 315.7172546386719, "t": 433.823486328125, "r": 536.835693359375, "b": 496.0290222167969, "coord_origin": "TOPLEFT"}, "confidence": 0.5088632702827454, "cells": [{"index": 89, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 347.249, "r_y0": 446.213, "r_x1": 351.641, "r_y1": 446.213, "r_x2": 351.641, "r_y2": 438.459, "r_x3": 347.249, "r_y3": 438.459, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 90, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 318.881, "r_y0": 446.213, "r_x1": 323.273, "r_y1": 446.213, "r_x2": 323.273, "r_y2": 438.459, "r_x3": 318.881, "r_y3": 438.459, "coord_origin": "TOPLEFT"}, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 91, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.104, "r_y0": 446.213, "r_x1": 398.497, "r_y1": 446.213, "r_x2": 398.497, "r_y2": 438.459, "r_x3": 394.104, "r_y3": 438.459, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 92, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 318.773, "r_y0": 458.073, "r_x1": 323.166, "r_y1": 458.073, "r_x2": 323.166, "r_y2": 450.319, "r_x3": 318.773, "r_y3": 450.319, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 93, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 347.249, "r_y0": 458.073, "r_x1": 351.641, "r_y1": 458.073, "r_x2": 351.641, "r_y2": 450.319, "r_x3": 347.249, "r_y3": 450.319, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 94, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.104, "r_y0": 458.073, "r_x1": 398.497, "r_y1": 458.073, "r_x2": 398.497, "r_y2": 450.319, "r_x3": 394.104, "r_y3": 450.319, "coord_origin": "TOPLEFT"}, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 95, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 440.959, "r_y0": 458.073, "r_x1": 445.352, "r_y1": 458.073, "r_x2": 445.352, "r_y2": 450.319, "r_x3": 440.959, "r_y3": 450.319, "coord_origin": "TOPLEFT"}, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 96, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 487.815, "r_y0": 458.073, "r_x1": 492.207, "r_y1": 458.073, "r_x2": 492.207, "r_y2": 450.319, "r_x3": 487.815, "r_y3": 450.319, "coord_origin": "TOPLEFT"}, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 97, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 318.773, "r_y0": 482.232, "r_x1": 323.166, "r_y1": 482.232, "r_x2": 323.166, "r_y2": 474.477, "r_x3": 318.773, "r_y3": 474.477, "coord_origin": "TOPLEFT"}, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 98, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 347.249, "r_y0": 470.372, "r_x1": 351.641, "r_y1": 470.372, "r_x2": 351.641, "r_y2": 462.618, "r_x3": 347.249, "r_y3": 462.618, "coord_origin": "TOPLEFT"}, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 99, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.104, "r_y0": 470.372, "r_x1": 402.888, "r_y1": 470.372, "r_x2": 402.888, "r_y2": 462.618, "r_x3": 394.104, "r_y3": 462.618, "coord_origin": "TOPLEFT"}, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 100, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 440.959, "r_y0": 470.372, "r_x1": 449.423, "r_y1": 470.372, "r_x2": 449.423, "r_y2": 462.618, "r_x3": 440.959, "r_y3": 462.618, "coord_origin": "TOPLEFT"}, "text": "11", "orig": "11", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 101, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 487.815, "r_y0": 470.372, "r_x1": 496.599, "r_y1": 470.372, "r_x2": 496.599, "r_y2": 462.618, "r_x3": 487.815, "r_y3": 462.618, "coord_origin": "TOPLEFT"}, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 102, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 347.249, "r_y0": 482.232, "r_x1": 356.033, "r_y1": 482.232, "r_x2": 356.033, "r_y2": 474.477, "r_x3": 347.249, "r_y3": 474.477, "coord_origin": "TOPLEFT"}, "text": "13", "orig": "13", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 103, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.104, "r_y0": 482.232, "r_x1": 402.888, "r_y1": 482.232, "r_x2": 402.888, "r_y2": 474.477, "r_x3": 394.104, "r_y3": 474.477, "coord_origin": "TOPLEFT"}, "text": "14", "orig": "14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 104, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 440.959, "r_y0": 482.232, "r_x1": 449.743, "r_y1": 482.232, "r_x2": 449.743, "r_y2": 474.477, "r_x3": 440.959, "r_y3": 474.477, "coord_origin": "TOPLEFT"}, "text": "15", "orig": "15", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 105, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 487.815, "r_y0": 482.232, "r_x1": 496.599, "r_y1": 482.232, "r_x2": 496.599, "r_y2": 474.477, "r_x3": 487.815, "r_y3": 474.477, "coord_origin": "TOPLEFT"}, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 106, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 347.249, "r_y0": 493.652, "r_x1": 356.033, "r_y1": 493.652, "r_x2": 356.033, "r_y2": 485.898, "r_x3": 347.249, "r_y3": 485.898, "coord_origin": "TOPLEFT"}, "text": "17", "orig": "17", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 107, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.104, "r_y0": 493.652, "r_x1": 402.888, "r_y1": 493.652, "r_x2": 402.888, "r_y2": 485.898, "r_x3": 394.104, "r_y3": 485.898, "coord_origin": "TOPLEFT"}, "text": "18", "orig": "18", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 108, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 440.959, "r_y0": 493.652, "r_x1": 449.743, "r_y1": 493.652, "r_x2": 449.743, "r_y2": 485.898, "r_x3": 440.959, "r_y3": 485.898, "coord_origin": "TOPLEFT"}, "text": "19", "orig": "19", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 109, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 487.815, "r_y0": 493.652, "r_x1": 496.599, "r_y1": 493.652, "r_x2": 496.599, "r_y2": 485.898, "r_x3": 487.815, "r_y3": 485.898, "coord_origin": "TOPLEFT"}, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 112, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 366.701, "r_y0": 459.214, "r_x1": 372.706, "r_y1": 459.214, "r_x2": 372.706, "r_y2": 449.25, "r_x3": 366.701, "r_y3": 449.25, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 115, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 331.904, "r_y0": 483.416, "r_x1": 337.909, "r_y1": 483.416, "r_x2": 337.909, "r_y2": 473.452, "r_x3": 331.904, "r_y3": 473.452, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 117, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 459.876, "r_y0": 447.687, "r_x1": 465.881, "r_y1": 447.687, "r_x2": 465.881, "r_y2": 437.723, "r_x3": 459.876, "r_y3": 437.723, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": [{"id": 61, "label": "text", "bbox": {"l": 347.249, "t": 438.459, "r": 351.641, "b": 446.213, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 89, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 347.249, "r_y0": 446.213, "r_x1": 351.641, "r_y1": 446.213, "r_x2": 351.641, "r_y2": 438.459, "r_x3": 347.249, "r_y3": 438.459, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 62, "label": "text", "bbox": {"l": 318.881, "t": 438.459, "r": 323.273, "b": 446.213, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 90, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 318.881, "r_y0": 446.213, "r_x1": 323.273, "r_y1": 446.213, "r_x2": 323.273, "r_y2": 438.459, "r_x3": 318.881, "r_y3": 438.459, "coord_origin": "TOPLEFT"}, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 63, "label": "text", "bbox": {"l": 394.104, "t": 438.459, "r": 398.497, "b": 446.213, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 91, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.104, "r_y0": 446.213, "r_x1": 398.497, "r_y1": 446.213, "r_x2": 398.497, "r_y2": 438.459, "r_x3": 394.104, "r_y3": 438.459, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 64, "label": "text", "bbox": {"l": 318.773, "t": 450.319, "r": 323.166, "b": 458.073, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 92, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 318.773, "r_y0": 458.073, "r_x1": 323.166, "r_y1": 458.073, "r_x2": 323.166, "r_y2": 450.319, "r_x3": 318.773, "r_y3": 450.319, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 65, "label": "text", "bbox": {"l": 347.249, "t": 450.319, "r": 351.641, "b": 458.073, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 93, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 347.249, "r_y0": 458.073, "r_x1": 351.641, "r_y1": 458.073, "r_x2": 351.641, "r_y2": 450.319, "r_x3": 347.249, "r_y3": 450.319, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 66, "label": "text", "bbox": {"l": 394.104, "t": 450.319, "r": 398.497, "b": 458.073, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 94, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.104, "r_y0": 458.073, "r_x1": 398.497, "r_y1": 458.073, "r_x2": 398.497, "r_y2": 450.319, "r_x3": 394.104, "r_y3": 450.319, "coord_origin": "TOPLEFT"}, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 67, "label": "text", "bbox": {"l": 440.959, "t": 450.319, "r": 445.352, "b": 458.073, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 95, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 440.959, "r_y0": 458.073, "r_x1": 445.352, "r_y1": 458.073, "r_x2": 445.352, "r_y2": 450.319, "r_x3": 440.959, "r_y3": 450.319, "coord_origin": "TOPLEFT"}, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 68, "label": "text", "bbox": {"l": 487.815, "t": 450.319, "r": 492.207, "b": 458.073, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 96, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 487.815, "r_y0": 458.073, "r_x1": 492.207, "r_y1": 458.073, "r_x2": 492.207, "r_y2": 450.319, "r_x3": 487.815, "r_y3": 450.319, "coord_origin": "TOPLEFT"}, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 69, "label": "text", "bbox": {"l": 318.773, "t": 474.477, "r": 323.166, "b": 482.232, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 97, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 318.773, "r_y0": 482.232, "r_x1": 323.166, "r_y1": 482.232, "r_x2": 323.166, "r_y2": 474.477, "r_x3": 318.773, "r_y3": 474.477, "coord_origin": "TOPLEFT"}, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 70, "label": "text", "bbox": {"l": 347.249, "t": 462.618, "r": 351.641, "b": 470.372, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 98, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 347.249, "r_y0": 470.372, "r_x1": 351.641, "r_y1": 470.372, "r_x2": 351.641, "r_y2": 462.618, "r_x3": 347.249, "r_y3": 462.618, "coord_origin": "TOPLEFT"}, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 71, "label": "text", "bbox": {"l": 394.104, "t": 462.618, "r": 402.888, "b": 470.372, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 99, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.104, "r_y0": 470.372, "r_x1": 402.888, "r_y1": 470.372, "r_x2": 402.888, "r_y2": 462.618, "r_x3": 394.104, "r_y3": 462.618, "coord_origin": "TOPLEFT"}, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 72, "label": "text", "bbox": {"l": 440.959, "t": 462.618, "r": 449.423, "b": 470.372, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 100, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 440.959, "r_y0": 470.372, "r_x1": 449.423, "r_y1": 470.372, "r_x2": 449.423, "r_y2": 462.618, "r_x3": 440.959, "r_y3": 462.618, "coord_origin": "TOPLEFT"}, "text": "11", "orig": "11", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 73, "label": "text", "bbox": {"l": 487.815, "t": 462.618, "r": 496.599, "b": 470.372, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 101, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 487.815, "r_y0": 470.372, "r_x1": 496.599, "r_y1": 470.372, "r_x2": 496.599, "r_y2": 462.618, "r_x3": 487.815, "r_y3": 462.618, "coord_origin": "TOPLEFT"}, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 74, "label": "text", "bbox": {"l": 347.249, "t": 474.477, "r": 356.033, "b": 482.232, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 102, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 347.249, "r_y0": 482.232, "r_x1": 356.033, "r_y1": 482.232, "r_x2": 356.033, "r_y2": 474.477, "r_x3": 347.249, "r_y3": 474.477, "coord_origin": "TOPLEFT"}, "text": "13", "orig": "13", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 75, "label": "text", "bbox": {"l": 394.104, "t": 474.477, "r": 402.888, "b": 482.232, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 103, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.104, "r_y0": 482.232, "r_x1": 402.888, "r_y1": 482.232, "r_x2": 402.888, "r_y2": 474.477, "r_x3": 394.104, "r_y3": 474.477, "coord_origin": "TOPLEFT"}, "text": "14", "orig": "14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 76, "label": "text", "bbox": {"l": 440.959, "t": 474.477, "r": 449.743, "b": 482.232, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 104, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 440.959, "r_y0": 482.232, "r_x1": 449.743, "r_y1": 482.232, "r_x2": 449.743, "r_y2": 474.477, "r_x3": 440.959, "r_y3": 474.477, "coord_origin": "TOPLEFT"}, "text": "15", "orig": "15", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 77, "label": "text", "bbox": {"l": 487.815, "t": 474.477, "r": 496.599, "b": 482.232, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 105, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 487.815, "r_y0": 482.232, "r_x1": 496.599, "r_y1": 482.232, "r_x2": 496.599, "r_y2": 474.477, "r_x3": 487.815, "r_y3": 474.477, "coord_origin": "TOPLEFT"}, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 78, "label": "text", "bbox": {"l": 347.249, "t": 485.898, "r": 356.033, "b": 493.652, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 106, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 347.249, "r_y0": 493.652, "r_x1": 356.033, "r_y1": 493.652, "r_x2": 356.033, "r_y2": 485.898, "r_x3": 347.249, "r_y3": 485.898, "coord_origin": "TOPLEFT"}, "text": "17", "orig": "17", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 79, "label": "text", "bbox": {"l": 394.104, "t": 485.898, "r": 402.888, "b": 493.652, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 107, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.104, "r_y0": 493.652, "r_x1": 402.888, "r_y1": 493.652, "r_x2": 402.888, "r_y2": 485.898, "r_x3": 394.104, "r_y3": 485.898, "coord_origin": "TOPLEFT"}, "text": "18", "orig": "18", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 80, "label": "text", "bbox": {"l": 440.959, "t": 485.898, "r": 449.743, "b": 493.652, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 108, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 440.959, "r_y0": 493.652, "r_x1": 449.743, "r_y1": 493.652, "r_x2": 449.743, "r_y2": 485.898, "r_x3": 440.959, "r_y3": 485.898, "coord_origin": "TOPLEFT"}, "text": "19", "orig": "19", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 81, "label": "text", "bbox": {"l": 487.815, "t": 485.898, "r": 496.599, "b": 493.652, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 109, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 487.815, "r_y0": 493.652, "r_x1": 496.599, "r_y1": 493.652, "r_x2": 496.599, "r_y2": 485.898, "r_x3": 487.815, "r_y3": 485.898, "coord_origin": "TOPLEFT"}, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 84, "label": "text", "bbox": {"l": 366.701, "t": 449.25, "r": 372.706, "b": 459.214, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 112, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 366.701, "r_y0": 459.214, "r_x1": 372.706, "r_y1": 459.214, "r_x2": 372.706, "r_y2": 449.25, "r_x3": 366.701, "r_y3": 449.25, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 87, "label": "text", "bbox": {"l": 331.904, "t": 473.452, "r": 337.909, "b": 483.416, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 115, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 331.904, "r_y0": 483.416, "r_x1": 337.909, "r_y1": 483.416, "r_x2": 337.909, "r_y2": 473.452, "r_x3": 331.904, "r_y3": 473.452, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 89, "label": "text", "bbox": {"l": 459.876, "t": 437.723, "r": 465.881, "b": 447.687, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 117, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 459.876, "r_y0": 447.687, "r_x1": 465.881, "r_y1": 447.687, "r_x2": 465.881, "r_y2": 437.723, "r_x3": 459.876, "r_y3": 437.723, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}]}, {"id": 11, "label": "table", "bbox": {"l": 315.7172546386719, "t": 433.823486328125, "r": 536.835693359375, "b": 496.0290222167969, "coord_origin": "TOPLEFT"}, "confidence": 0.8056110739707947, "cells": [{"index": 89, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 347.249, "r_y0": 446.213, "r_x1": 351.641, "r_y1": 446.213, "r_x2": 351.641, "r_y2": 438.459, "r_x3": 347.249, "r_y3": 438.459, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 90, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 318.881, "r_y0": 446.213, "r_x1": 323.273, "r_y1": 446.213, "r_x2": 323.273, "r_y2": 438.459, "r_x3": 318.881, "r_y3": 438.459, "coord_origin": "TOPLEFT"}, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 91, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.104, "r_y0": 446.213, "r_x1": 398.497, "r_y1": 446.213, "r_x2": 398.497, "r_y2": 438.459, "r_x3": 394.104, "r_y3": 438.459, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 92, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 318.773, "r_y0": 458.073, "r_x1": 323.166, "r_y1": 458.073, "r_x2": 323.166, "r_y2": 450.319, "r_x3": 318.773, "r_y3": 450.319, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 93, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 347.249, "r_y0": 458.073, "r_x1": 351.641, "r_y1": 458.073, "r_x2": 351.641, "r_y2": 450.319, "r_x3": 347.249, "r_y3": 450.319, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 94, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.104, "r_y0": 458.073, "r_x1": 398.497, "r_y1": 458.073, "r_x2": 398.497, "r_y2": 450.319, "r_x3": 394.104, "r_y3": 450.319, "coord_origin": "TOPLEFT"}, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 95, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 440.959, "r_y0": 458.073, "r_x1": 445.352, "r_y1": 458.073, "r_x2": 445.352, "r_y2": 450.319, "r_x3": 440.959, "r_y3": 450.319, "coord_origin": "TOPLEFT"}, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 96, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 487.815, "r_y0": 458.073, "r_x1": 492.207, "r_y1": 458.073, "r_x2": 492.207, "r_y2": 450.319, "r_x3": 487.815, "r_y3": 450.319, "coord_origin": "TOPLEFT"}, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 97, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 318.773, "r_y0": 482.232, "r_x1": 323.166, "r_y1": 482.232, "r_x2": 323.166, "r_y2": 474.477, "r_x3": 318.773, "r_y3": 474.477, "coord_origin": "TOPLEFT"}, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 98, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 347.249, "r_y0": 470.372, "r_x1": 351.641, "r_y1": 470.372, "r_x2": 351.641, "r_y2": 462.618, "r_x3": 347.249, "r_y3": 462.618, "coord_origin": "TOPLEFT"}, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 99, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.104, "r_y0": 470.372, "r_x1": 402.888, "r_y1": 470.372, "r_x2": 402.888, "r_y2": 462.618, "r_x3": 394.104, "r_y3": 462.618, "coord_origin": "TOPLEFT"}, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 100, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 440.959, "r_y0": 470.372, "r_x1": 449.423, "r_y1": 470.372, "r_x2": 449.423, "r_y2": 462.618, "r_x3": 440.959, "r_y3": 462.618, "coord_origin": "TOPLEFT"}, "text": "11", "orig": "11", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 101, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 487.815, "r_y0": 470.372, "r_x1": 496.599, "r_y1": 470.372, "r_x2": 496.599, "r_y2": 462.618, "r_x3": 487.815, "r_y3": 462.618, "coord_origin": "TOPLEFT"}, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 102, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 347.249, "r_y0": 482.232, "r_x1": 356.033, "r_y1": 482.232, "r_x2": 356.033, "r_y2": 474.477, "r_x3": 347.249, "r_y3": 474.477, "coord_origin": "TOPLEFT"}, "text": "13", "orig": "13", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 103, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.104, "r_y0": 482.232, "r_x1": 402.888, "r_y1": 482.232, "r_x2": 402.888, "r_y2": 474.477, "r_x3": 394.104, "r_y3": 474.477, "coord_origin": "TOPLEFT"}, "text": "14", "orig": "14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 104, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 440.959, "r_y0": 482.232, "r_x1": 449.743, "r_y1": 482.232, "r_x2": 449.743, "r_y2": 474.477, "r_x3": 440.959, "r_y3": 474.477, "coord_origin": "TOPLEFT"}, "text": "15", "orig": "15", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 105, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 487.815, "r_y0": 482.232, "r_x1": 496.599, "r_y1": 482.232, "r_x2": 496.599, "r_y2": 474.477, "r_x3": 487.815, "r_y3": 474.477, "coord_origin": "TOPLEFT"}, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 106, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 347.249, "r_y0": 493.652, "r_x1": 356.033, "r_y1": 493.652, "r_x2": 356.033, "r_y2": 485.898, "r_x3": 347.249, "r_y3": 485.898, "coord_origin": "TOPLEFT"}, "text": "17", "orig": "17", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 107, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.104, "r_y0": 493.652, "r_x1": 402.888, "r_y1": 493.652, "r_x2": 402.888, "r_y2": 485.898, "r_x3": 394.104, "r_y3": 485.898, "coord_origin": "TOPLEFT"}, "text": "18", "orig": "18", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 108, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 440.959, "r_y0": 493.652, "r_x1": 449.743, "r_y1": 493.652, "r_x2": 449.743, "r_y2": 485.898, "r_x3": 440.959, "r_y3": 485.898, "coord_origin": "TOPLEFT"}, "text": "19", "orig": "19", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 109, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 487.815, "r_y0": 493.652, "r_x1": 496.599, "r_y1": 493.652, "r_x2": 496.599, "r_y2": 485.898, "r_x3": 487.815, "r_y3": 485.898, "coord_origin": "TOPLEFT"}, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 112, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 366.701, "r_y0": 459.214, "r_x1": 372.706, "r_y1": 459.214, "r_x2": 372.706, "r_y2": 449.25, "r_x3": 366.701, "r_y3": 449.25, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 115, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 331.904, "r_y0": 483.416, "r_x1": 337.909, "r_y1": 483.416, "r_x2": 337.909, "r_y2": 473.452, "r_x3": 331.904, "r_y3": 473.452, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 117, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 459.876, "r_y0": 447.687, "r_x1": 465.881, "r_y1": 447.687, "r_x2": 465.881, "r_y2": 437.723, "r_x3": 459.876, "r_y3": 437.723, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": [{"id": 61, "label": "text", "bbox": {"l": 347.249, "t": 438.459, "r": 351.641, "b": 446.213, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 89, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 347.249, "r_y0": 446.213, "r_x1": 351.641, "r_y1": 446.213, "r_x2": 351.641, "r_y2": 438.459, "r_x3": 347.249, "r_y3": 438.459, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 62, "label": "text", "bbox": {"l": 318.881, "t": 438.459, "r": 323.273, "b": 446.213, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 90, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 318.881, "r_y0": 446.213, "r_x1": 323.273, "r_y1": 446.213, "r_x2": 323.273, "r_y2": 438.459, "r_x3": 318.881, "r_y3": 438.459, "coord_origin": "TOPLEFT"}, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 63, "label": "text", "bbox": {"l": 394.104, "t": 438.459, "r": 398.497, "b": 446.213, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 91, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.104, "r_y0": 446.213, "r_x1": 398.497, "r_y1": 446.213, "r_x2": 398.497, "r_y2": 438.459, "r_x3": 394.104, "r_y3": 438.459, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 64, "label": "text", "bbox": {"l": 318.773, "t": 450.319, "r": 323.166, "b": 458.073, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 92, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 318.773, "r_y0": 458.073, "r_x1": 323.166, "r_y1": 458.073, "r_x2": 323.166, "r_y2": 450.319, "r_x3": 318.773, "r_y3": 450.319, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 65, "label": "text", "bbox": {"l": 347.249, "t": 450.319, "r": 351.641, "b": 458.073, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 93, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 347.249, "r_y0": 458.073, "r_x1": 351.641, "r_y1": 458.073, "r_x2": 351.641, "r_y2": 450.319, "r_x3": 347.249, "r_y3": 450.319, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 66, "label": "text", "bbox": {"l": 394.104, "t": 450.319, "r": 398.497, "b": 458.073, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 94, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.104, "r_y0": 458.073, "r_x1": 398.497, "r_y1": 458.073, "r_x2": 398.497, "r_y2": 450.319, "r_x3": 394.104, "r_y3": 450.319, "coord_origin": "TOPLEFT"}, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 67, "label": "text", "bbox": {"l": 440.959, "t": 450.319, "r": 445.352, "b": 458.073, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 95, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 440.959, "r_y0": 458.073, "r_x1": 445.352, "r_y1": 458.073, "r_x2": 445.352, "r_y2": 450.319, "r_x3": 440.959, "r_y3": 450.319, "coord_origin": "TOPLEFT"}, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 68, "label": "text", "bbox": {"l": 487.815, "t": 450.319, "r": 492.207, "b": 458.073, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 96, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 487.815, "r_y0": 458.073, "r_x1": 492.207, "r_y1": 458.073, "r_x2": 492.207, "r_y2": 450.319, "r_x3": 487.815, "r_y3": 450.319, "coord_origin": "TOPLEFT"}, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 69, "label": "text", "bbox": {"l": 318.773, "t": 474.477, "r": 323.166, "b": 482.232, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 97, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 318.773, "r_y0": 482.232, "r_x1": 323.166, "r_y1": 482.232, "r_x2": 323.166, "r_y2": 474.477, "r_x3": 318.773, "r_y3": 474.477, "coord_origin": "TOPLEFT"}, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 70, "label": "text", "bbox": {"l": 347.249, "t": 462.618, "r": 351.641, "b": 470.372, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 98, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 347.249, "r_y0": 470.372, "r_x1": 351.641, "r_y1": 470.372, "r_x2": 351.641, "r_y2": 462.618, "r_x3": 347.249, "r_y3": 462.618, "coord_origin": "TOPLEFT"}, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 71, "label": "text", "bbox": {"l": 394.104, "t": 462.618, "r": 402.888, "b": 470.372, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 99, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.104, "r_y0": 470.372, "r_x1": 402.888, "r_y1": 470.372, "r_x2": 402.888, "r_y2": 462.618, "r_x3": 394.104, "r_y3": 462.618, "coord_origin": "TOPLEFT"}, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 72, "label": "text", "bbox": {"l": 440.959, "t": 462.618, "r": 449.423, "b": 470.372, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 100, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 440.959, "r_y0": 470.372, "r_x1": 449.423, "r_y1": 470.372, "r_x2": 449.423, "r_y2": 462.618, "r_x3": 440.959, "r_y3": 462.618, "coord_origin": "TOPLEFT"}, "text": "11", "orig": "11", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 73, "label": "text", "bbox": {"l": 487.815, "t": 462.618, "r": 496.599, "b": 470.372, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 101, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 487.815, "r_y0": 470.372, "r_x1": 496.599, "r_y1": 470.372, "r_x2": 496.599, "r_y2": 462.618, "r_x3": 487.815, "r_y3": 462.618, "coord_origin": "TOPLEFT"}, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 74, "label": "text", "bbox": {"l": 347.249, "t": 474.477, "r": 356.033, "b": 482.232, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 102, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 347.249, "r_y0": 482.232, "r_x1": 356.033, "r_y1": 482.232, "r_x2": 356.033, "r_y2": 474.477, "r_x3": 347.249, "r_y3": 474.477, "coord_origin": "TOPLEFT"}, "text": "13", "orig": "13", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 75, "label": "text", "bbox": {"l": 394.104, "t": 474.477, "r": 402.888, "b": 482.232, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 103, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.104, "r_y0": 482.232, "r_x1": 402.888, "r_y1": 482.232, "r_x2": 402.888, "r_y2": 474.477, "r_x3": 394.104, "r_y3": 474.477, "coord_origin": "TOPLEFT"}, "text": "14", "orig": "14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 76, "label": "text", "bbox": {"l": 440.959, "t": 474.477, "r": 449.743, "b": 482.232, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 104, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 440.959, "r_y0": 482.232, "r_x1": 449.743, "r_y1": 482.232, "r_x2": 449.743, "r_y2": 474.477, "r_x3": 440.959, "r_y3": 474.477, "coord_origin": "TOPLEFT"}, "text": "15", "orig": "15", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 77, "label": "text", "bbox": {"l": 487.815, "t": 474.477, "r": 496.599, "b": 482.232, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 105, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 487.815, "r_y0": 482.232, "r_x1": 496.599, "r_y1": 482.232, "r_x2": 496.599, "r_y2": 474.477, "r_x3": 487.815, "r_y3": 474.477, "coord_origin": "TOPLEFT"}, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 78, "label": "text", "bbox": {"l": 347.249, "t": 485.898, "r": 356.033, "b": 493.652, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 106, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 347.249, "r_y0": 493.652, "r_x1": 356.033, "r_y1": 493.652, "r_x2": 356.033, "r_y2": 485.898, "r_x3": 347.249, "r_y3": 485.898, "coord_origin": "TOPLEFT"}, "text": "17", "orig": "17", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 79, "label": "text", "bbox": {"l": 394.104, "t": 485.898, "r": 402.888, "b": 493.652, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 107, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.104, "r_y0": 493.652, "r_x1": 402.888, "r_y1": 493.652, "r_x2": 402.888, "r_y2": 485.898, "r_x3": 394.104, "r_y3": 485.898, "coord_origin": "TOPLEFT"}, "text": "18", "orig": "18", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 80, "label": "text", "bbox": {"l": 440.959, "t": 485.898, "r": 449.743, "b": 493.652, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 108, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 440.959, "r_y0": 493.652, "r_x1": 449.743, "r_y1": 493.652, "r_x2": 449.743, "r_y2": 485.898, "r_x3": 440.959, "r_y3": 485.898, "coord_origin": "TOPLEFT"}, "text": "19", "orig": "19", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 81, "label": "text", "bbox": {"l": 487.815, "t": 485.898, "r": 496.599, "b": 493.652, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 109, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 487.815, "r_y0": 493.652, "r_x1": 496.599, "r_y1": 493.652, "r_x2": 496.599, "r_y2": 485.898, "r_x3": 487.815, "r_y3": 485.898, "coord_origin": "TOPLEFT"}, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 84, "label": "text", "bbox": {"l": 366.701, "t": 449.25, "r": 372.706, "b": 459.214, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 112, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 366.701, "r_y0": 459.214, "r_x1": 372.706, "r_y1": 459.214, "r_x2": 372.706, "r_y2": 449.25, "r_x3": 366.701, "r_y3": 449.25, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 87, "label": "text", "bbox": {"l": 331.904, "t": 473.452, "r": 337.909, "b": 483.416, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 115, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 331.904, "r_y0": 483.416, "r_x1": 337.909, "r_y1": 483.416, "r_x2": 337.909, "r_y2": 473.452, "r_x3": 331.904, "r_y3": 473.452, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 89, "label": "text", "bbox": {"l": 459.876, "t": 437.723, "r": 465.881, "b": 447.687, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 117, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 459.876, "r_y0": 447.687, "r_x1": 465.881, "r_y1": 447.687, "r_x2": 465.881, "r_y2": 437.723, "r_x3": 459.876, "r_y3": 437.723, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}]}, {"id": 16, "label": "picture", "bbox": {"l": 315.65362548828125, "t": 228.723388671875, "r": 537.1475219726562, "b": 302.8014221191406, "coord_origin": "TOPLEFT"}, "confidence": 0.608779788017273, "cells": [{"index": 110, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 451.946, "r_y0": 245.44000000000005, "r_x1": 457.951, "r_y1": 245.44000000000005, "r_x2": 457.951, "r_y2": 235.47699999999998, "r_x3": 451.946, "r_y3": 235.47699999999998, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 113, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 331.197, "r_y0": 279.446, "r_x1": 337.202, "r_y1": 279.446, "r_x2": 337.202, "r_y2": 269.48199999999997, "r_x3": 331.197, "r_y3": 269.48199999999997, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 118, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 384.033, "r_y0": 262.77200000000005, "r_x1": 390.038, "r_y1": 262.77200000000005, "r_x2": 390.038, "r_y2": 252.80899999999997, "r_x3": 384.033, "r_y3": 252.80899999999997, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": [{"id": 82, "label": "text", "bbox": {"l": 451.946, "t": 235.47699999999998, "r": 457.951, "b": 245.44000000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 110, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 451.946, "r_y0": 245.44000000000005, "r_x1": 457.951, "r_y1": 245.44000000000005, "r_x2": 457.951, "r_y2": 235.47699999999998, "r_x3": 451.946, "r_y3": 235.47699999999998, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 85, "label": "text", "bbox": {"l": 331.197, "t": 269.48199999999997, "r": 337.202, "b": 279.446, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 113, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 331.197, "r_y0": 279.446, "r_x1": 337.202, "r_y1": 279.446, "r_x2": 337.202, "r_y2": 269.48199999999997, "r_x3": 331.197, "r_y3": 269.48199999999997, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 90, "label": "text", "bbox": {"l": 384.033, "t": 252.80899999999997, "r": 390.038, "b": 262.77200000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 118, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 384.033, "r_y0": 262.77200000000005, "r_x1": 390.038, "r_y1": 262.77200000000005, "r_x2": 390.038, "r_y2": 252.80899999999997, "r_x3": 384.033, "r_y3": 252.80899999999997, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}]}, {"id": 15, "label": "table", "bbox": {"l": 315.65362548828125, "t": 228.723388671875, "r": 537.1475219726562, "b": 302.8014221191406, "coord_origin": "TOPLEFT"}, "confidence": 0.6515864729881287, "cells": [{"index": 110, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 451.946, "r_y0": 245.44000000000005, "r_x1": 457.951, "r_y1": 245.44000000000005, "r_x2": 457.951, "r_y2": 235.47699999999998, "r_x3": 451.946, "r_y3": 235.47699999999998, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 113, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 331.197, "r_y0": 279.446, "r_x1": 337.202, "r_y1": 279.446, "r_x2": 337.202, "r_y2": 269.48199999999997, "r_x3": 331.197, "r_y3": 269.48199999999997, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 118, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 384.033, "r_y0": 262.77200000000005, "r_x1": 390.038, "r_y1": 262.77200000000005, "r_x2": 390.038, "r_y2": 252.80899999999997, "r_x3": 384.033, "r_y3": 252.80899999999997, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": [{"id": 82, "label": "text", "bbox": {"l": 451.946, "t": 235.47699999999998, "r": 457.951, "b": 245.44000000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 110, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 451.946, "r_y0": 245.44000000000005, "r_x1": 457.951, "r_y1": 245.44000000000005, "r_x2": 457.951, "r_y2": 235.47699999999998, "r_x3": 451.946, "r_y3": 235.47699999999998, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 85, "label": "text", "bbox": {"l": 331.197, "t": 269.48199999999997, "r": 337.202, "b": 279.446, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 113, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 331.197, "r_y0": 279.446, "r_x1": 337.202, "r_y1": 279.446, "r_x2": 337.202, "r_y2": 269.48199999999997, "r_x3": 331.197, "r_y3": 269.48199999999997, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 90, "label": "text", "bbox": {"l": 384.033, "t": 252.80899999999997, "r": 390.038, "b": 262.77200000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 118, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 384.033, "r_y0": 262.77200000000005, "r_x1": 390.038, "r_y1": 262.77200000000005, "r_x2": 390.038, "r_y2": 252.80899999999997, "r_x3": 384.033, "r_y3": 252.80899999999997, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}]}, {"id": 6, "label": "caption", "bbox": {"l": 308.862, "t": 514.769, "r": 545.115, "b": 559.187, "coord_origin": "TOPLEFT"}, "confidence": 0.9214619398117065, "cells": [{"index": 119, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 523.321, "r_x1": 345.734, "r_y1": 523.321, "r_x2": 345.734, "r_y2": 514.769, "r_x3": 308.862, "r_y3": 514.769, "coord_origin": "TOPLEFT"}, "text": "Figure 1:", "orig": "Figure 1:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 120, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 353.176, "r_y0": 523.321, "r_x1": 545.115, "r_y1": 523.321, "r_x2": 545.115, "r_y2": 514.769, "r_x3": 353.176, "r_y3": 514.769, "coord_origin": "TOPLEFT"}, "text": "Picture of a table with subtle, complex features", "orig": "Picture of a table with subtle, complex features", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 121, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 535.2760000000001, "r_x1": 545.115, "r_y1": 535.2760000000001, "r_x2": 545.115, "r_y2": 526.7239999999999, "r_x3": 308.862, "r_y3": 526.7239999999999, "coord_origin": "TOPLEFT"}, "text": "such as (1) multi-column headers, (2) cell with multi-row", "orig": "such as (1) multi-column headers, (2) cell with multi-row", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 122, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 547.231, "r_x1": 445.539, "r_y1": 547.231, "r_x2": 445.539, "r_y2": 538.679, "r_x3": 308.862, "r_y3": 538.679, "coord_origin": "TOPLEFT"}, "text": "text and (3) cells with no content.", "orig": "text and (3) cells with no content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 123, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 450.221, "r_y0": 547.231, "r_x1": 545.115, "r_y1": 547.231, "r_x2": 545.115, "r_y2": 538.679, "r_x3": 450.221, "r_y3": 538.679, "coord_origin": "TOPLEFT"}, "text": "Image from PubTabNet", "orig": "Image from PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 124, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 559.187, "r_x1": 505.692, "r_y1": 559.187, "r_x2": 505.692, "r_y2": 550.635, "r_x3": 308.862, "r_y3": 550.635, "coord_origin": "TOPLEFT"}, "text": "evaluation set, filename: 'PMC2944238 004 02'.", "orig": "evaluation set, filename: 'PMC2944238 004 02'.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 0, "label": "text", "bbox": {"l": 308.862, "t": 584.678, "r": 545.115, "b": 664.961, "coord_origin": "TOPLEFT"}, "confidence": 0.9848759770393372, "cells": [{"index": 125, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 593.23, "r_x1": 358.077, "r_y1": 593.23, "r_x2": 358.077, "r_y2": 584.678, "r_x3": 320.817, "r_y3": 584.678, "coord_origin": "TOPLEFT"}, "text": "Recently,", "orig": "Recently,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 126, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 362.62, "r_y0": 593.23, "r_x1": 404.134, "r_y1": 593.23, "r_x2": 404.134, "r_y2": 584.678, "r_x3": 362.62, "r_y3": 584.678, "coord_origin": "TOPLEFT"}, "text": "significant", "orig": "significant", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 127, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 408.259, "r_y0": 593.23, "r_x1": 545.115, "r_y1": 593.23, "r_x2": 545.115, "r_y2": 584.678, "r_x3": 408.259, "r_y3": 584.678, "coord_origin": "TOPLEFT"}, "text": "progress has been made with vi-", "orig": "progress has been made with vi-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 128, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 605.185, "r_x1": 526.365, "r_y1": 605.185, "r_x2": 526.365, "r_y2": 596.633, "r_x3": 308.862, "r_y3": 596.633, "coord_origin": "TOPLEFT"}, "text": "sion based approaches to extract tables in documents.", "orig": "sion based approaches to extract tables in documents.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 129, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 531.426, "r_y0": 605.185, "r_x1": 545.115, "r_y1": 605.185, "r_x2": 545.115, "r_y2": 596.633, "r_x3": 531.426, "r_y3": 596.633, "coord_origin": "TOPLEFT"}, "text": "For", "orig": "For", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 130, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 617.14, "r_x1": 545.115, "r_y1": 617.14, "r_x2": 545.115, "r_y2": 608.588, "r_x3": 308.862, "r_y3": 608.588, "coord_origin": "TOPLEFT"}, "text": "the sake of completeness, the issue of table extraction from", "orig": "the sake of completeness, the issue of table extraction from", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 131, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 629.095, "r_x1": 545.115, "r_y1": 629.095, "r_x2": 545.115, "r_y2": 620.543, "r_x3": 308.862, "r_y3": 620.543, "coord_origin": "TOPLEFT"}, "text": "documents is typically decomposed into two separate chal-", "orig": "documents is typically decomposed into two separate chal-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 132, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 641.0509999999999, "r_x1": 336.807, "r_y1": 641.0509999999999, "r_x2": 336.807, "r_y2": 632.499, "r_x3": 308.862, "r_y3": 632.499, "coord_origin": "TOPLEFT"}, "text": "lenges,", "orig": "lenges,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 133, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 341.519, "r_y0": 641.0509999999999, "r_x1": 353.694, "r_y1": 641.0509999999999, "r_x2": 353.694, "r_y2": 632.499, "r_x3": 341.519, "r_y3": 632.499, "coord_origin": "TOPLEFT"}, "text": "i.e.", "orig": "i.e.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 134, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 362.112, "r_y0": 641.0509999999999, "r_x1": 373.728, "r_y1": 641.0509999999999, "r_x2": 373.728, "r_y2": 632.499, "r_x3": 362.112, "r_y3": 632.499, "coord_origin": "TOPLEFT"}, "text": "(1)", "orig": "(1)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 135, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 377.992, "r_y0": 641.0509999999999, "r_x1": 406.226, "r_y1": 641.0509999999999, "r_x2": 406.226, "r_y2": 632.499, "r_x3": 377.992, "r_y3": 632.499, "coord_origin": "TOPLEFT"}, "text": "finding", "orig": "finding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 136, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 410.5, "r_y0": 641.0509999999999, "r_x1": 422.675, "r_y1": 641.0509999999999, "r_x2": 422.675, "r_y2": 632.499, "r_x3": 410.5, "r_y3": 632.499, "coord_origin": "TOPLEFT"}, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 137, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 426.939, "r_y0": 641.0509999999999, "r_x1": 459.038, "r_y1": 641.0509999999999, "r_x2": 459.038, "r_y2": 632.499, "r_x3": 426.939, "r_y3": 632.499, "coord_origin": "TOPLEFT"}, "text": "location", "orig": "location", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 138, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 463.302, "r_y0": 641.0509999999999, "r_x1": 471.601, "r_y1": 641.0509999999999, "r_x2": 471.601, "r_y2": 632.499, "r_x3": 463.302, "r_y3": 632.499, "coord_origin": "TOPLEFT"}, "text": "of", "orig": "of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 139, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 475.875, "r_y0": 641.0509999999999, "r_x1": 488.049, "r_y1": 641.0509999999999, "r_x2": 488.049, "r_y2": 632.499, "r_x3": 475.875, "r_y3": 632.499, "coord_origin": "TOPLEFT"}, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 140, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 492.313, "r_y0": 641.0509999999999, "r_x1": 522.191, "r_y1": 641.0509999999999, "r_x2": 522.191, "r_y2": 632.499, "r_x3": 492.313, "r_y3": 632.499, "coord_origin": "TOPLEFT"}, "text": "table(s)", "orig": "table(s)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 141, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 526.455, "r_y0": 641.0509999999999, "r_x1": 545.115, "r_y1": 641.0509999999999, "r_x2": 545.115, "r_y2": 632.499, "r_x3": 526.455, "r_y3": 632.499, "coord_origin": "TOPLEFT"}, "text": "on a", "orig": "on a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 142, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 653.006, "r_x1": 545.115, "r_y1": 653.006, "r_x2": 545.115, "r_y2": 644.454, "r_x3": 308.862, "r_y3": 644.454, "coord_origin": "TOPLEFT"}, "text": "document-page and (2) finding the structure of a given table", "orig": "document-page and (2) finding the structure of a given table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 143, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 664.961, "r_x1": 375.552, "r_y1": 664.961, "r_x2": 375.552, "r_y2": 656.409, "r_x3": 308.862, "r_y3": 656.409, "coord_origin": "TOPLEFT"}, "text": "in the document.", "orig": "in the document.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 3, "label": "text", "bbox": {"l": 308.862, "t": 668.649, "r": 545.115, "b": 713.066, "coord_origin": "TOPLEFT"}, "confidence": 0.979152262210846, "cells": [{"index": 144, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 677.201, "r_x1": 545.115, "r_y1": 677.201, "r_x2": 545.115, "r_y2": 668.649, "r_x3": 320.817, "r_y3": 668.649, "coord_origin": "TOPLEFT"}, "text": "The first problem is called table-location and has been", "orig": "The first problem is called table-location and has been", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 145, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 689.156, "r_x1": 545.115, "r_y1": 689.156, "r_x2": 545.115, "r_y2": 680.604, "r_x3": 308.862, "r_y3": 680.604, "coord_origin": "TOPLEFT"}, "text": "previously addressed [30, 38, 19, 21, 23, 26, 8] with state-", "orig": "previously addressed [30, 38, 19, 21, 23, 26, 8] with state-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 146, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 701.111, "r_x1": 474.261, "r_y1": 701.111, "r_x2": 474.261, "r_y2": 692.559, "r_x3": 308.862, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "of-the-art object-detection networks (e.g.", "orig": "of-the-art object-detection networks (e.g.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 147, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 479.342, "r_y0": 701.111, "r_x1": 545.115, "r_y1": 701.111, "r_x2": 545.115, "r_y2": 692.559, "r_x3": 479.342, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "YOLO and later", "orig": "YOLO and later", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 148, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 713.066, "r_x1": 395.796, "r_y1": 713.066, "r_x2": 395.796, "r_y2": 704.514, "r_x3": 308.862, "r_y3": 704.514, "coord_origin": "TOPLEFT"}, "text": "on Mask-RCNN [9]).", "orig": "on Mask-RCNN [9]).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 149, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 401.046, "r_y0": 713.066, "r_x1": 545.115, "r_y1": 713.066, "r_x2": 545.115, "r_y2": 704.514, "r_x3": 401.046, "r_y3": 704.514, "coord_origin": "TOPLEFT"}, "text": "For all practical purposes, it can be", "orig": "For all practical purposes, it can be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 12, "label": "page_footer", "bbox": {"l": 295.121, "t": 734.402, "r": 300.102, "b": 742.954, "coord_origin": "TOPLEFT"}, "confidence": 0.8045893311500549, "cells": [{"index": 150, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 295.121, "r_y0": 742.954, "r_x1": 300.102, "r_y1": 742.954, "r_x2": 300.102, "r_y2": 734.402, "r_x3": 295.121, "r_y3": 734.402, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 9, "label": "page_header", "bbox": {"l": 18.34, "t": 210.0, "r": 36.34, "b": 560.0, "coord_origin": "TOPLEFT"}, "confidence": 0.8773143887519836, "cells": [{"index": 151, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 36.34, "r_y0": 560.0, "r_x1": 36.34, "r_y1": 380.0, "r_x2": 18.34, "r_y2": 380.0, "r_x3": 18.34, "r_y3": 560.0, "coord_origin": "TOPLEFT"}, "text": "arXiv:2203.01017v2", "orig": "arXiv:2203.01017v2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 152, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 36.34, "r_y0": 360.0, "r_x1": 36.34, "r_y1": 290.0, "r_x2": 18.34, "r_y2": 290.0, "r_x3": 18.34, "r_y3": 360.0, "coord_origin": "TOPLEFT"}, "text": "[cs.CV]", "orig": "[cs.CV]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 153, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 36.34, "r_y0": 270.0, "r_x1": 36.34, "r_y1": 250.0, "r_x2": 18.34, "r_y2": 250.0, "r_x3": 18.34, "r_y3": 270.0, "coord_origin": "TOPLEFT"}, "text": "11", "orig": "11", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 154, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 36.34, "r_y0": 240.0, "r_x1": 36.34, "r_y1": 210.0, "r_x2": 18.34, "r_y2": 210.0, "r_x3": 18.34, "r_y3": 240.0, "coord_origin": "TOPLEFT"}, "text": "Mar", "orig": "Mar", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 91, "label": "text", "bbox": {"l": 18.34, "t": 160.0, "r": 36.34, "b": 200.0, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 155, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 36.34, "r_y0": 200.0, "r_x1": 36.34, "r_y1": 160.0, "r_x2": 18.34, "r_y2": 160.0, "r_x3": 18.34, "r_y3": 200.0, "coord_origin": "TOPLEFT"}, "text": "2022", "orig": "2022", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}]}, "tablestructure": {"table_map": {"11": {"label": "table", "id": 11, "page_no": 0, "cluster": {"id": 11, "label": "table", "bbox": {"l": 315.7172546386719, "t": 433.823486328125, "r": 536.835693359375, "b": 496.0290222167969, "coord_origin": "TOPLEFT"}, "confidence": 0.8056110739707947, "cells": [{"index": 89, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 347.249, "r_y0": 446.213, "r_x1": 351.641, "r_y1": 446.213, "r_x2": 351.641, "r_y2": 438.459, "r_x3": 347.249, "r_y3": 438.459, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 90, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 318.881, "r_y0": 446.213, "r_x1": 323.273, "r_y1": 446.213, "r_x2": 323.273, "r_y2": 438.459, "r_x3": 318.881, "r_y3": 438.459, "coord_origin": "TOPLEFT"}, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 91, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.104, "r_y0": 446.213, "r_x1": 398.497, "r_y1": 446.213, "r_x2": 398.497, "r_y2": 438.459, "r_x3": 394.104, "r_y3": 438.459, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 92, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 318.773, "r_y0": 458.073, "r_x1": 323.166, "r_y1": 458.073, "r_x2": 323.166, "r_y2": 450.319, "r_x3": 318.773, "r_y3": 450.319, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 93, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 347.249, "r_y0": 458.073, "r_x1": 351.641, "r_y1": 458.073, "r_x2": 351.641, "r_y2": 450.319, "r_x3": 347.249, "r_y3": 450.319, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 94, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.104, "r_y0": 458.073, "r_x1": 398.497, "r_y1": 458.073, "r_x2": 398.497, "r_y2": 450.319, "r_x3": 394.104, "r_y3": 450.319, "coord_origin": "TOPLEFT"}, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 95, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 440.959, "r_y0": 458.073, "r_x1": 445.352, "r_y1": 458.073, "r_x2": 445.352, "r_y2": 450.319, "r_x3": 440.959, "r_y3": 450.319, "coord_origin": "TOPLEFT"}, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 96, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 487.815, "r_y0": 458.073, "r_x1": 492.207, "r_y1": 458.073, "r_x2": 492.207, "r_y2": 450.319, "r_x3": 487.815, "r_y3": 450.319, "coord_origin": "TOPLEFT"}, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 97, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 318.773, "r_y0": 482.232, "r_x1": 323.166, "r_y1": 482.232, "r_x2": 323.166, "r_y2": 474.477, "r_x3": 318.773, "r_y3": 474.477, "coord_origin": "TOPLEFT"}, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 98, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 347.249, "r_y0": 470.372, "r_x1": 351.641, "r_y1": 470.372, "r_x2": 351.641, "r_y2": 462.618, "r_x3": 347.249, "r_y3": 462.618, "coord_origin": "TOPLEFT"}, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 99, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.104, "r_y0": 470.372, "r_x1": 402.888, "r_y1": 470.372, "r_x2": 402.888, "r_y2": 462.618, "r_x3": 394.104, "r_y3": 462.618, "coord_origin": "TOPLEFT"}, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 100, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 440.959, "r_y0": 470.372, "r_x1": 449.423, "r_y1": 470.372, "r_x2": 449.423, "r_y2": 462.618, "r_x3": 440.959, "r_y3": 462.618, "coord_origin": "TOPLEFT"}, "text": "11", "orig": "11", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 101, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 487.815, "r_y0": 470.372, "r_x1": 496.599, "r_y1": 470.372, "r_x2": 496.599, "r_y2": 462.618, "r_x3": 487.815, "r_y3": 462.618, "coord_origin": "TOPLEFT"}, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 102, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 347.249, "r_y0": 482.232, "r_x1": 356.033, "r_y1": 482.232, "r_x2": 356.033, "r_y2": 474.477, "r_x3": 347.249, "r_y3": 474.477, "coord_origin": "TOPLEFT"}, "text": "13", "orig": "13", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 103, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.104, "r_y0": 482.232, "r_x1": 402.888, "r_y1": 482.232, "r_x2": 402.888, "r_y2": 474.477, "r_x3": 394.104, "r_y3": 474.477, "coord_origin": "TOPLEFT"}, "text": "14", "orig": "14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 104, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 440.959, "r_y0": 482.232, "r_x1": 449.743, "r_y1": 482.232, "r_x2": 449.743, "r_y2": 474.477, "r_x3": 440.959, "r_y3": 474.477, "coord_origin": "TOPLEFT"}, "text": "15", "orig": "15", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 105, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 487.815, "r_y0": 482.232, "r_x1": 496.599, "r_y1": 482.232, "r_x2": 496.599, "r_y2": 474.477, "r_x3": 487.815, "r_y3": 474.477, "coord_origin": "TOPLEFT"}, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 106, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 347.249, "r_y0": 493.652, "r_x1": 356.033, "r_y1": 493.652, "r_x2": 356.033, "r_y2": 485.898, "r_x3": 347.249, "r_y3": 485.898, "coord_origin": "TOPLEFT"}, "text": "17", "orig": "17", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 107, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.104, "r_y0": 493.652, "r_x1": 402.888, "r_y1": 493.652, "r_x2": 402.888, "r_y2": 485.898, "r_x3": 394.104, "r_y3": 485.898, "coord_origin": "TOPLEFT"}, "text": "18", "orig": "18", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 108, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 440.959, "r_y0": 493.652, "r_x1": 449.743, "r_y1": 493.652, "r_x2": 449.743, "r_y2": 485.898, "r_x3": 440.959, "r_y3": 485.898, "coord_origin": "TOPLEFT"}, "text": "19", "orig": "19", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 109, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 487.815, "r_y0": 493.652, "r_x1": 496.599, "r_y1": 493.652, "r_x2": 496.599, "r_y2": 485.898, "r_x3": 487.815, "r_y3": 485.898, "coord_origin": "TOPLEFT"}, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 112, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 366.701, "r_y0": 459.214, "r_x1": 372.706, "r_y1": 459.214, "r_x2": 372.706, "r_y2": 449.25, "r_x3": 366.701, "r_y3": 449.25, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 115, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 331.904, "r_y0": 483.416, "r_x1": 337.909, "r_y1": 483.416, "r_x2": 337.909, "r_y2": 473.452, "r_x3": 331.904, "r_y3": 473.452, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 117, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 459.876, "r_y0": 447.687, "r_x1": 465.881, "r_y1": 447.687, "r_x2": 465.881, "r_y2": 437.723, "r_x3": 459.876, "r_y3": 437.723, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": [{"id": 61, "label": "text", "bbox": {"l": 347.249, "t": 438.459, "r": 351.641, "b": 446.213, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 89, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 347.249, "r_y0": 446.213, "r_x1": 351.641, "r_y1": 446.213, "r_x2": 351.641, "r_y2": 438.459, "r_x3": 347.249, "r_y3": 438.459, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 62, "label": "text", "bbox": {"l": 318.881, "t": 438.459, "r": 323.273, "b": 446.213, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 90, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 318.881, "r_y0": 446.213, "r_x1": 323.273, "r_y1": 446.213, "r_x2": 323.273, "r_y2": 438.459, "r_x3": 318.881, "r_y3": 438.459, "coord_origin": "TOPLEFT"}, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 63, "label": "text", "bbox": {"l": 394.104, "t": 438.459, "r": 398.497, "b": 446.213, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 91, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.104, "r_y0": 446.213, "r_x1": 398.497, "r_y1": 446.213, "r_x2": 398.497, "r_y2": 438.459, "r_x3": 394.104, "r_y3": 438.459, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 64, "label": "text", "bbox": {"l": 318.773, "t": 450.319, "r": 323.166, "b": 458.073, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 92, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 318.773, "r_y0": 458.073, "r_x1": 323.166, "r_y1": 458.073, "r_x2": 323.166, "r_y2": 450.319, "r_x3": 318.773, "r_y3": 450.319, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 65, "label": "text", "bbox": {"l": 347.249, "t": 450.319, "r": 351.641, "b": 458.073, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 93, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 347.249, "r_y0": 458.073, "r_x1": 351.641, "r_y1": 458.073, "r_x2": 351.641, "r_y2": 450.319, "r_x3": 347.249, "r_y3": 450.319, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 66, "label": "text", "bbox": {"l": 394.104, "t": 450.319, "r": 398.497, "b": 458.073, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 94, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.104, "r_y0": 458.073, "r_x1": 398.497, "r_y1": 458.073, "r_x2": 398.497, "r_y2": 450.319, "r_x3": 394.104, "r_y3": 450.319, "coord_origin": "TOPLEFT"}, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 67, "label": "text", "bbox": {"l": 440.959, "t": 450.319, "r": 445.352, "b": 458.073, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 95, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 440.959, "r_y0": 458.073, "r_x1": 445.352, "r_y1": 458.073, "r_x2": 445.352, "r_y2": 450.319, "r_x3": 440.959, "r_y3": 450.319, "coord_origin": "TOPLEFT"}, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 68, "label": "text", "bbox": {"l": 487.815, "t": 450.319, "r": 492.207, "b": 458.073, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 96, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 487.815, "r_y0": 458.073, "r_x1": 492.207, "r_y1": 458.073, "r_x2": 492.207, "r_y2": 450.319, "r_x3": 487.815, "r_y3": 450.319, "coord_origin": "TOPLEFT"}, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 69, "label": "text", "bbox": {"l": 318.773, "t": 474.477, "r": 323.166, "b": 482.232, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 97, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 318.773, "r_y0": 482.232, "r_x1": 323.166, "r_y1": 482.232, "r_x2": 323.166, "r_y2": 474.477, "r_x3": 318.773, "r_y3": 474.477, "coord_origin": "TOPLEFT"}, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 70, "label": "text", "bbox": {"l": 347.249, "t": 462.618, "r": 351.641, "b": 470.372, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 98, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 347.249, "r_y0": 470.372, "r_x1": 351.641, "r_y1": 470.372, "r_x2": 351.641, "r_y2": 462.618, "r_x3": 347.249, "r_y3": 462.618, "coord_origin": "TOPLEFT"}, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 71, "label": "text", "bbox": {"l": 394.104, "t": 462.618, "r": 402.888, "b": 470.372, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 99, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.104, "r_y0": 470.372, "r_x1": 402.888, "r_y1": 470.372, "r_x2": 402.888, "r_y2": 462.618, "r_x3": 394.104, "r_y3": 462.618, "coord_origin": "TOPLEFT"}, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 72, "label": "text", "bbox": {"l": 440.959, "t": 462.618, "r": 449.423, "b": 470.372, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 100, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 440.959, "r_y0": 470.372, "r_x1": 449.423, "r_y1": 470.372, "r_x2": 449.423, "r_y2": 462.618, "r_x3": 440.959, "r_y3": 462.618, "coord_origin": "TOPLEFT"}, "text": "11", "orig": "11", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 73, "label": "text", "bbox": {"l": 487.815, "t": 462.618, "r": 496.599, "b": 470.372, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 101, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 487.815, "r_y0": 470.372, "r_x1": 496.599, "r_y1": 470.372, "r_x2": 496.599, "r_y2": 462.618, "r_x3": 487.815, "r_y3": 462.618, "coord_origin": "TOPLEFT"}, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 74, "label": "text", "bbox": {"l": 347.249, "t": 474.477, "r": 356.033, "b": 482.232, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 102, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 347.249, "r_y0": 482.232, "r_x1": 356.033, "r_y1": 482.232, "r_x2": 356.033, "r_y2": 474.477, "r_x3": 347.249, "r_y3": 474.477, "coord_origin": "TOPLEFT"}, "text": "13", "orig": "13", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 75, "label": "text", "bbox": {"l": 394.104, "t": 474.477, "r": 402.888, "b": 482.232, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 103, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.104, "r_y0": 482.232, "r_x1": 402.888, "r_y1": 482.232, "r_x2": 402.888, "r_y2": 474.477, "r_x3": 394.104, "r_y3": 474.477, "coord_origin": "TOPLEFT"}, "text": "14", "orig": "14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 76, "label": "text", "bbox": {"l": 440.959, "t": 474.477, "r": 449.743, "b": 482.232, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 104, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 440.959, "r_y0": 482.232, "r_x1": 449.743, "r_y1": 482.232, "r_x2": 449.743, "r_y2": 474.477, "r_x3": 440.959, "r_y3": 474.477, "coord_origin": "TOPLEFT"}, "text": "15", "orig": "15", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 77, "label": "text", "bbox": {"l": 487.815, "t": 474.477, "r": 496.599, "b": 482.232, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 105, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 487.815, "r_y0": 482.232, "r_x1": 496.599, "r_y1": 482.232, "r_x2": 496.599, "r_y2": 474.477, "r_x3": 487.815, "r_y3": 474.477, "coord_origin": "TOPLEFT"}, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 78, "label": "text", "bbox": {"l": 347.249, "t": 485.898, "r": 356.033, "b": 493.652, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 106, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 347.249, "r_y0": 493.652, "r_x1": 356.033, "r_y1": 493.652, "r_x2": 356.033, "r_y2": 485.898, "r_x3": 347.249, "r_y3": 485.898, "coord_origin": "TOPLEFT"}, "text": "17", "orig": "17", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 79, "label": "text", "bbox": {"l": 394.104, "t": 485.898, "r": 402.888, "b": 493.652, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 107, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.104, "r_y0": 493.652, "r_x1": 402.888, "r_y1": 493.652, "r_x2": 402.888, "r_y2": 485.898, "r_x3": 394.104, "r_y3": 485.898, "coord_origin": "TOPLEFT"}, "text": "18", "orig": "18", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 80, "label": "text", "bbox": {"l": 440.959, "t": 485.898, "r": 449.743, "b": 493.652, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 108, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 440.959, "r_y0": 493.652, "r_x1": 449.743, "r_y1": 493.652, "r_x2": 449.743, "r_y2": 485.898, "r_x3": 440.959, "r_y3": 485.898, "coord_origin": "TOPLEFT"}, "text": "19", "orig": "19", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 81, "label": "text", "bbox": {"l": 487.815, "t": 485.898, "r": 496.599, "b": 493.652, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 109, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 487.815, "r_y0": 493.652, "r_x1": 496.599, "r_y1": 493.652, "r_x2": 496.599, "r_y2": 485.898, "r_x3": 487.815, "r_y3": 485.898, "coord_origin": "TOPLEFT"}, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 84, "label": "text", "bbox": {"l": 366.701, "t": 449.25, "r": 372.706, "b": 459.214, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 112, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 366.701, "r_y0": 459.214, "r_x1": 372.706, "r_y1": 459.214, "r_x2": 372.706, "r_y2": 449.25, "r_x3": 366.701, "r_y3": 449.25, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 87, "label": "text", "bbox": {"l": 331.904, "t": 473.452, "r": 337.909, "b": 483.416, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 115, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 331.904, "r_y0": 483.416, "r_x1": 337.909, "r_y1": 483.416, "r_x2": 337.909, "r_y2": 473.452, "r_x3": 331.904, "r_y3": 473.452, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 89, "label": "text", "bbox": {"l": 459.876, "t": 437.723, "r": 465.881, "b": 447.687, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 117, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 459.876, "r_y0": 447.687, "r_x1": 465.881, "r_y1": 447.687, "r_x2": 465.881, "r_y2": 437.723, "r_x3": 459.876, "r_y3": 437.723, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}]}, "text": null, "otsl_seq": ["fcel", "fcel", "lcel", "lcel", "lcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 5, "num_cols": 5, "table_cells": [{"bbox": {"l": 347.249, "t": 437.723, "r": 465.881, "b": 447.687, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 4, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 1, "end_col_offset_idx": 5, "text": "1 2 1", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 318.881, "t": 438.459, "r": 323.273, "b": 446.213, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "0", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 318.773, "t": 450.319, "r": 323.166, "b": 458.073, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "3", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 347.249, "t": 449.25, "r": 372.706, "b": 459.214, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "4 3", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 394.104, "t": 450.319, "r": 398.497, "b": 458.073, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "5", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 440.959, "t": 450.319, "r": 445.352, "b": 458.073, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "6", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 487.815, "t": 450.319, "r": 492.207, "b": 458.073, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "7", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 318.773, "t": 473.452, "r": 337.909, "b": 483.416, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "8 2", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 347.249, "t": 462.618, "r": 351.641, "b": 470.372, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "9", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 394.104, "t": 462.618, "r": 402.888, "b": 470.372, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "10", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 440.959, "t": 462.618, "r": 449.423, "b": 470.372, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "11", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 487.815, "t": 462.618, "r": 496.599, "b": 470.372, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "12", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 347.249, "t": 474.477, "r": 356.033, "b": 482.232, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "13", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 394.104, "t": 474.477, "r": 402.888, "b": 482.232, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "14", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 440.959, "t": 474.477, "r": 449.743, "b": 482.232, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "15", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 487.815, "t": 474.477, "r": 496.599, "b": 482.232, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "16", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 347.249, "t": 485.898, "r": 356.033, "b": 493.652, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "17", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 394.104, "t": 485.898, "r": 402.888, "b": 493.652, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "18", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 440.959, "t": 485.898, "r": 449.743, "b": 493.652, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "19", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 487.815, "t": 485.898, "r": 496.599, "b": 493.652, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "20", "column_header": false, "row_header": false, "row_section": false}]}, "15": {"label": "table", "id": 15, "page_no": 0, "cluster": {"id": 15, "label": "table", "bbox": {"l": 315.65362548828125, "t": 228.723388671875, "r": 537.1475219726562, "b": 302.8014221191406, "coord_origin": "TOPLEFT"}, "confidence": 0.6515864729881287, "cells": [{"index": 110, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 451.946, "r_y0": 245.44000000000005, "r_x1": 457.951, "r_y1": 245.44000000000005, "r_x2": 457.951, "r_y2": 235.47699999999998, "r_x3": 451.946, "r_y3": 235.47699999999998, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 113, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 331.197, "r_y0": 279.446, "r_x1": 337.202, "r_y1": 279.446, "r_x2": 337.202, "r_y2": 269.48199999999997, "r_x3": 331.197, "r_y3": 269.48199999999997, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 118, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 384.033, "r_y0": 262.77200000000005, "r_x1": 390.038, "r_y1": 262.77200000000005, "r_x2": 390.038, "r_y2": 252.80899999999997, "r_x3": 384.033, "r_y3": 252.80899999999997, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": [{"id": 82, "label": "text", "bbox": {"l": 451.946, "t": 235.47699999999998, "r": 457.951, "b": 245.44000000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 110, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 451.946, "r_y0": 245.44000000000005, "r_x1": 457.951, "r_y1": 245.44000000000005, "r_x2": 457.951, "r_y2": 235.47699999999998, "r_x3": 451.946, "r_y3": 235.47699999999998, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 85, "label": "text", "bbox": {"l": 331.197, "t": 269.48199999999997, "r": 337.202, "b": 279.446, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 113, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 331.197, "r_y0": 279.446, "r_x1": 337.202, "r_y1": 279.446, "r_x2": 337.202, "r_y2": 269.48199999999997, "r_x3": 331.197, "r_y3": 269.48199999999997, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 90, "label": "text", "bbox": {"l": 384.033, "t": 252.80899999999997, "r": 390.038, "b": 262.77200000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 118, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 384.033, "r_y0": 262.77200000000005, "r_x1": 390.038, "r_y1": 262.77200000000005, "r_x2": 390.038, "r_y2": 252.80899999999997, "r_x3": 384.033, "r_y3": 252.80899999999997, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}]}, "text": null, "otsl_seq": ["ecel", "ched", "ched", "ched", "ched", "nl", "rhed", "rhed", "fcel", "fcel", "fcel", "nl", "ucel", "rhed", "fcel", "fcel", "fcel", "nl", "ucel", "rhed", "fcel", "fcel", "fcel", "nl"], "num_rows": 1, "num_cols": 1, "table_cells": [{"bbox": {"l": 451.946, "t": 235.47699999999998, "r": 457.951, "b": 245.44000000000005, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "1", "column_header": true, "row_header": false, "row_section": false}]}}}, "figures_classification": null, "equations_prediction": null, "vlm_response": null}, "assembled": {"elements": [{"label": "section_header", "id": 8, "page_no": 0, "cluster": {"id": 8, "label": "section_header", "bbox": {"l": 96.301, "t": 107.03399999999999, "r": 498.927, "b": 119.93100000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.8868067860603333, "cells": [{"index": 0, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 96.301, "r_y0": 119.93100000000004, "r_x1": 498.927, "r_y1": 119.93100000000004, "r_x2": 498.927, "r_y2": 107.03399999999999, "r_x3": 96.301, "r_y3": 107.03399999999999, "coord_origin": "TOPLEFT"}, "text": "TableFormer: Table Structure Understanding with Transformers.", "orig": "TableFormer: Table Structure Understanding with Transformers.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "TableFormer: Table Structure Understanding with Transformers."}, {"label": "section_header", "id": 13, "page_no": 0, "cluster": {"id": 13, "label": "section_header", "bbox": {"l": 142.477, "t": 147.00800000000004, "r": 452.75, "b": 171.21699999999998, "coord_origin": "TOPLEFT"}, "confidence": 0.7586215734481812, "cells": [{"index": 1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 142.477, "r_y0": 157.26999999999998, "r_x1": 452.75, "r_y1": 157.26999999999998, "r_x2": 452.75, "r_y2": 147.00800000000004, "r_x3": 142.477, "r_y3": 147.00800000000004, "coord_origin": "TOPLEFT"}, "text": "Ahmed Nassar, Nikolaos Livathinos, Maksym Lysak, Peter Staar", "orig": "Ahmed Nassar, Nikolaos Livathinos, Maksym Lysak, Peter Staar", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 262.918, "r_y0": 171.21699999999998, "r_x1": 332.306, "r_y1": 171.21699999999998, "r_x2": 332.306, "r_y2": 160.95500000000004, "r_x3": 262.918, "r_y3": 160.95500000000004, "coord_origin": "TOPLEFT"}, "text": "IBM Research", "orig": "IBM Research", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Ahmed Nassar, Nikolaos Livathinos, Maksym Lysak, Peter Staar IBM Research"}, {"label": "key_value_region", "id": 25, "page_no": 0, "cluster": {"id": 25, "label": "key_value_region", "bbox": {"l": 208.123, "t": 176.562, "r": 378.733, "b": 184.26999999999998, "coord_origin": "TOPLEFT"}, "confidence": 0.4854728579521179, "cells": [{"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 208.123, "r_y0": 184.26999999999998, "r_x1": 212.731, "r_y1": 184.26999999999998, "r_x2": 212.731, "r_y2": 176.562, "r_x3": 208.123, "r_y3": 176.562, "coord_origin": "TOPLEFT"}, "text": "{", "orig": "{", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 212.73, "r_y0": 183.861, "r_x1": 378.733, "r_y1": 183.861, "r_x2": 378.733, "r_y2": 177.692, "r_x3": 212.73, "r_y3": 177.692, "coord_origin": "TOPLEFT"}, "text": "ahn,nli,mly,taa @zurich.ibm.com", "orig": "ahn,nli,mly,taa @zurich.ibm.com", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 293.428, "r_y0": 184.26999999999998, "r_x1": 298.036, "r_y1": 184.26999999999998, "r_x2": 298.036, "r_y2": 176.562, "r_x3": 293.428, "r_y3": 176.562, "coord_origin": "TOPLEFT"}, "text": "}", "orig": "}", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": [{"id": 7, "label": "text", "bbox": {"l": 208.123, "t": 176.562, "r": 378.733, "b": 184.26999999999998, "coord_origin": "TOPLEFT"}, "confidence": 0.9096331596374512, "cells": [{"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 208.123, "r_y0": 184.26999999999998, "r_x1": 212.731, "r_y1": 184.26999999999998, "r_x2": 212.731, "r_y2": 176.562, "r_x3": 208.123, "r_y3": 176.562, "coord_origin": "TOPLEFT"}, "text": "{", "orig": "{", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 212.73, "r_y0": 183.861, "r_x1": 378.733, "r_y1": 183.861, "r_x2": 378.733, "r_y2": 177.692, "r_x3": 212.73, "r_y3": 177.692, "coord_origin": "TOPLEFT"}, "text": "ahn,nli,mly,taa @zurich.ibm.com", "orig": "ahn,nli,mly,taa @zurich.ibm.com", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 293.428, "r_y0": 184.26999999999998, "r_x1": 298.036, "r_y1": 184.26999999999998, "r_x2": 298.036, "r_y2": 176.562, "r_x3": 293.428, "r_y3": 176.562, "coord_origin": "TOPLEFT"}, "text": "}", "orig": "}", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}]}, "text": null}, {"label": "section_header", "id": 5, "page_no": 0, "cluster": {"id": 5, "label": "section_header", "bbox": {"l": 145.995, "t": 215.48299999999995, "r": 190.48, "b": 226.231, "coord_origin": "TOPLEFT"}, "confidence": 0.9258671402931213, "cells": [{"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 145.995, "r_y0": 226.231, "r_x1": 190.48, "r_y1": 226.231, "r_x2": 190.48, "r_y2": 215.48299999999995, "r_x3": 145.995, "r_y3": 215.48299999999995, "coord_origin": "TOPLEFT"}, "text": "Abstract", "orig": "Abstract", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Abstract"}, {"label": "text", "id": 2, "page_no": 0, "cluster": {"id": 2, "label": "text", "bbox": {"l": 50.112, "t": 241.39499999999998, "r": 286.365, "b": 512.9970000000001, "coord_origin": "TOPLEFT"}, "confidence": 0.9838882088661194, "cells": [{"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 249.98299999999995, "r_x1": 286.365, "r_y1": 249.98299999999995, "r_x2": 286.365, "r_y2": 241.39499999999998, "r_x3": 62.067, "r_y3": 241.39499999999998, "coord_origin": "TOPLEFT"}, "text": "Tables organize valuable content in a concise and com-", "orig": "Tables organize valuable content in a concise and com-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 261.938, "r_x1": 130.062, "r_y1": 261.938, "r_x2": 130.062, "r_y2": 253.35000000000002, "r_x3": 50.112, "r_y3": 253.35000000000002, "coord_origin": "TOPLEFT"}, "text": "pact representation.", "orig": "pact representation.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.475, "r_y0": 261.938, "r_x1": 286.365, "r_y1": 261.938, "r_x2": 286.365, "r_y2": 253.35000000000002, "r_x3": 134.475, "r_y3": 253.35000000000002, "coord_origin": "TOPLEFT"}, "text": "This content is extremely valuable for", "orig": "This content is extremely valuable for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 273.89300000000003, "r_x1": 286.365, "r_y1": 273.89300000000003, "r_x2": 286.365, "r_y2": 265.30499999999995, "r_x3": 50.112, "r_y3": 265.30499999999995, "coord_origin": "TOPLEFT"}, "text": "systems such as search engines, Knowledge Graph's, etc,", "orig": "systems such as search engines, Knowledge Graph's, etc,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 285.849, "r_x1": 245.18, "r_y1": 285.849, "r_x2": 245.18, "r_y2": 277.26099999999997, "r_x3": 50.112, "r_y3": 277.26099999999997, "coord_origin": "TOPLEFT"}, "text": "since they enhance their predictive capabilities.", "orig": "since they enhance their predictive capabilities.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 251.496, "r_y0": 285.849, "r_x1": 286.365, "r_y1": 285.849, "r_x2": 286.365, "r_y2": 277.26099999999997, "r_x3": 251.496, "r_y3": 277.26099999999997, "coord_origin": "TOPLEFT"}, "text": "Unfortu-", "orig": "Unfortu-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 297.804, "r_x1": 286.365, "r_y1": 297.804, "r_x2": 286.365, "r_y2": 289.216, "r_x3": 50.112, "r_y3": 289.216, "coord_origin": "TOPLEFT"}, "text": "nately, tables come in a large variety of shapes and sizes.", "orig": "nately, tables come in a large variety of shapes and sizes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 309.759, "r_x1": 103.601, "r_y1": 309.759, "r_x2": 103.601, "r_y2": 301.171, "r_x3": 50.112, "r_y3": 301.171, "coord_origin": "TOPLEFT"}, "text": "Furthermore,", "orig": "Furthermore,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 108.393, "r_y0": 309.759, "r_x1": 124.692, "r_y1": 309.759, "r_x2": 124.692, "r_y2": 301.171, "r_x3": 108.393, "r_y3": 301.171, "coord_origin": "TOPLEFT"}, "text": "they", "orig": "they", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 129.026, "r_y0": 309.759, "r_x1": 286.365, "r_y1": 309.759, "r_x2": 286.365, "r_y2": 301.171, "r_x3": 129.026, "r_y3": 301.171, "coord_origin": "TOPLEFT"}, "text": "can have complex column/row-header", "orig": "can have complex column/row-header", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 321.714, "r_x1": 286.365, "r_y1": 321.714, "r_x2": 286.365, "r_y2": 313.126, "r_x3": 50.112, "r_y3": 313.126, "coord_origin": "TOPLEFT"}, "text": "configurations, multiline rows, different variety of separa-", "orig": "configurations, multiline rows, different variety of separa-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 333.669, "r_x1": 175.123, "r_y1": 333.669, "r_x2": 175.123, "r_y2": 325.081, "r_x3": 50.112, "r_y3": 325.081, "coord_origin": "TOPLEFT"}, "text": "tion lines, missing entries, etc.", "orig": "tion lines, missing entries, etc.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 19, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 180.931, "r_y0": 333.669, "r_x1": 286.365, "r_y1": 333.669, "r_x2": 286.365, "r_y2": 325.081, "r_x3": 180.931, "r_y3": 325.081, "coord_origin": "TOPLEFT"}, "text": "As such, the correct iden-", "orig": "As such, the correct iden-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 20, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 345.624, "r_x1": 85.539, "r_y1": 345.624, "r_x2": 85.539, "r_y2": 337.036, "r_x3": 50.112, "r_y3": 337.036, "coord_origin": "TOPLEFT"}, "text": "tification", "orig": "tification", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 21, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 89.942, "r_y0": 345.624, "r_x1": 97.693, "r_y1": 345.624, "r_x2": 97.693, "r_y2": 337.036, "r_x3": 89.942, "r_y3": 337.036, "coord_origin": "TOPLEFT"}, "text": "of", "orig": "of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 22, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 102.107, "r_y0": 345.624, "r_x1": 114.281, "r_y1": 345.624, "r_x2": 114.281, "r_y2": 337.036, "r_x3": 102.107, "r_y3": 337.036, "coord_origin": "TOPLEFT"}, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 23, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 118.695, "r_y0": 345.624, "r_x1": 177.534, "r_y1": 345.624, "r_x2": 177.534, "r_y2": 337.036, "r_x3": 118.695, "r_y3": 337.036, "coord_origin": "TOPLEFT"}, "text": "table-structure", "orig": "table-structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 24, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 181.947, "r_y0": 345.624, "r_x1": 286.365, "r_y1": 345.624, "r_x2": 286.365, "r_y2": 337.036, "r_x3": 181.947, "r_y3": 337.036, "coord_origin": "TOPLEFT"}, "text": "from an image is a non-", "orig": "from an image is a non-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 25, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 357.58, "r_x1": 95.791, "r_y1": 357.58, "r_x2": 95.791, "r_y2": 348.992, "r_x3": 50.112, "r_y3": 348.992, "coord_origin": "TOPLEFT"}, "text": "trivial task.", "orig": "trivial task.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 26, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 99.746, "r_y0": 357.58, "r_x1": 286.365, "r_y1": 357.58, "r_x2": 286.365, "r_y2": 348.992, "r_x3": 99.746, "r_y3": 348.992, "coord_origin": "TOPLEFT"}, "text": "In this paper, we present a new table-structure", "orig": "In this paper, we present a new table-structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 27, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 369.535, "r_x1": 132.443, "r_y1": 369.535, "r_x2": 132.443, "r_y2": 360.947, "r_x3": 50.112, "r_y3": 360.947, "coord_origin": "TOPLEFT"}, "text": "identification model.", "orig": "identification model.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 28, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 136.777, "r_y0": 369.535, "r_x1": 286.365, "r_y1": 369.535, "r_x2": 286.365, "r_y2": 360.947, "r_x3": 136.777, "r_y3": 360.947, "coord_origin": "TOPLEFT"}, "text": "The latter improves the latest end-to-", "orig": "The latter improves the latest end-to-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 29, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 381.49, "r_x1": 170.4, "r_y1": 381.49, "r_x2": 170.4, "r_y2": 372.902, "r_x3": 50.112, "r_y3": 372.902, "coord_origin": "TOPLEFT"}, "text": "end deep learning model (i.e.", "orig": "end deep learning model (i.e.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 30, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 176.248, "r_y0": 381.49, "r_x1": 286.365, "r_y1": 381.49, "r_x2": 286.365, "r_y2": 372.902, "r_x3": 176.248, "r_y3": 372.902, "coord_origin": "TOPLEFT"}, "text": "encoder-dual-decoder from", "orig": "encoder-dual-decoder from", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 393.445, "r_x1": 196.572, "r_y1": 393.445, "r_x2": 196.572, "r_y2": 384.857, "r_x3": 50.112, "r_y3": 384.857, "coord_origin": "TOPLEFT"}, "text": "PubTabNet) in two significant ways.", "orig": "PubTabNet) in two significant ways.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 201.643, "r_y0": 393.445, "r_x1": 286.365, "r_y1": 393.445, "r_x2": 286.365, "r_y2": 384.857, "r_x3": 201.643, "r_y3": 384.857, "coord_origin": "TOPLEFT"}, "text": "First, we introduce a", "orig": "First, we introduce a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 405.4, "r_x1": 232.328, "r_y1": 405.4, "r_x2": 232.328, "r_y2": 396.812, "r_x3": 50.112, "r_y3": 396.812, "coord_origin": "TOPLEFT"}, "text": "new object detection decoder for table-cells.", "orig": "new object detection decoder for table-cells.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 238.584, "r_y0": 405.4, "r_x1": 286.365, "r_y1": 405.4, "r_x2": 286.365, "r_y2": 396.812, "r_x3": 238.584, "r_y3": 396.812, "coord_origin": "TOPLEFT"}, "text": "In this way,", "orig": "In this way,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 417.355, "r_x1": 286.365, "r_y1": 417.355, "r_x2": 286.365, "r_y2": 408.767, "r_x3": 50.112, "r_y3": 408.767, "coord_origin": "TOPLEFT"}, "text": "we can obtain the content of the table-cells from program-", "orig": "we can obtain the content of the table-cells from program-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 429.311, "r_x1": 286.365, "r_y1": 429.311, "r_x2": 286.365, "r_y2": 420.723, "r_x3": 50.112, "r_y3": 420.723, "coord_origin": "TOPLEFT"}, "text": "matic PDF's directly from the PDF source and avoid the", "orig": "matic PDF's directly from the PDF source and avoid the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 441.266, "r_x1": 207.232, "r_y1": 441.266, "r_x2": 207.232, "r_y2": 432.678, "r_x3": 50.112, "r_y3": 432.678, "coord_origin": "TOPLEFT"}, "text": "training of the custom OCR decoders.", "orig": "training of the custom OCR decoders.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 214.096, "r_y0": 441.266, "r_x1": 286.365, "r_y1": 441.266, "r_x2": 286.365, "r_y2": 432.678, "r_x3": 214.096, "r_y3": 432.678, "coord_origin": "TOPLEFT"}, "text": "This architectural", "orig": "This architectural", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 453.221, "r_x1": 286.365, "r_y1": 453.221, "r_x2": 286.365, "r_y2": 444.633, "r_x3": 50.112, "r_y3": 444.633, "coord_origin": "TOPLEFT"}, "text": "change leads to more accurate table-content extraction and", "orig": "change leads to more accurate table-content extraction and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 465.176, "r_x1": 204.233, "r_y1": 465.176, "r_x2": 204.233, "r_y2": 456.588, "r_x3": 50.112, "r_y3": 456.588, "coord_origin": "TOPLEFT"}, "text": "allows us to tackle non-english tables.", "orig": "allows us to tackle non-english tables.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 208.587, "r_y0": 465.176, "r_x1": 286.365, "r_y1": 465.176, "r_x2": 286.365, "r_y2": 456.588, "r_x3": 208.587, "r_y3": 456.588, "coord_origin": "TOPLEFT"}, "text": "Second, we replace", "orig": "Second, we replace", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 477.131, "r_x1": 286.365, "r_y1": 477.131, "r_x2": 286.365, "r_y2": 468.543, "r_x3": 50.112, "r_y3": 468.543, "coord_origin": "TOPLEFT"}, "text": "the LSTM decoders with transformer based decoders. This", "orig": "the LSTM decoders with transformer based decoders. This", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 489.087, "r_x1": 286.365, "r_y1": 489.087, "r_x2": 286.365, "r_y2": 480.499, "r_x3": 50.112, "r_y3": 480.499, "coord_origin": "TOPLEFT"}, "text": "upgrade improves significantly the previous state-of-the-art", "orig": "upgrade improves significantly the previous state-of-the-art", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 501.042, "r_x1": 286.365, "r_y1": 501.042, "r_x2": 286.365, "r_y2": 492.454, "r_x3": 50.112, "r_y3": 492.454, "coord_origin": "TOPLEFT"}, "text": "tree-editing-distance-score (TEDS) from 91% to 98.5% on", "orig": "tree-editing-distance-score (TEDS) from 91% to 98.5% on", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 512.9970000000001, "r_x1": 276.652, "r_y1": 512.9970000000001, "r_x2": 276.652, "r_y2": 504.409, "r_x3": 50.112, "r_y3": 504.409, "coord_origin": "TOPLEFT"}, "text": "simple tables and from 88.7% to 95% on complex tables.", "orig": "simple tables and from 88.7% to 95% on complex tables.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Tables organize valuable content in a concise and compact representation. This content is extremely valuable for systems such as search engines, Knowledge Graph's, etc, since they enhance their predictive capabilities. Unfortunately, tables come in a large variety of shapes and sizes. Furthermore, they can have complex column/row-header configurations, multiline rows, different variety of separation lines, missing entries, etc. As such, the correct identification of the table-structure from an image is a nontrivial task. In this paper, we present a new table-structure identification model. The latter improves the latest end-toend deep learning model (i.e. encoder-dual-decoder from PubTabNet) in two significant ways. First, we introduce a new object detection decoder for table-cells. In this way, we can obtain the content of the table-cells from programmatic PDF's directly from the PDF source and avoid the training of the custom OCR decoders. This architectural change leads to more accurate table-content extraction and allows us to tackle non-english tables. Second, we replace the LSTM decoders with transformer based decoders. This upgrade improves significantly the previous state-of-the-art tree-editing-distance-score (TEDS) from 91% to 98.5% on simple tables and from 88.7% to 95% on complex tables."}, {"label": "section_header", "id": 4, "page_no": 0, "cluster": {"id": 4, "label": "section_header", "bbox": {"l": 50.112, "t": 539.943, "r": 126.948, "b": 550.691, "coord_origin": "TOPLEFT"}, "confidence": 0.9317677617073059, "cells": [{"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 550.691, "r_x1": 126.948, "r_y1": 550.691, "r_x2": 126.948, "r_y2": 539.943, "r_x3": 50.112, "r_y3": 539.943, "coord_origin": "TOPLEFT"}, "text": "1. Introduction", "orig": "1. Introduction", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "1. Introduction"}, {"label": "text", "id": 1, "page_no": 0, "cluster": {"id": 1, "label": "text", "bbox": {"l": 50.112, "t": 561.052, "r": 286.365, "b": 713.066, "coord_origin": "TOPLEFT"}, "confidence": 0.9841895699501038, "cells": [{"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 569.604, "r_x1": 166.266, "r_y1": 569.604, "r_x2": 166.266, "r_y2": 561.052, "r_x3": 62.067, "r_y3": 561.052, "coord_origin": "TOPLEFT"}, "text": "The occurrence of tables", "orig": "The occurrence of tables", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 48, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 170.759, "r_y0": 569.604, "r_x1": 178.51, "r_y1": 569.604, "r_x2": 178.51, "r_y2": 561.052, "r_x3": 170.759, "r_y3": 561.052, "coord_origin": "TOPLEFT"}, "text": "in", "orig": "in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 49, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.003, "r_y0": 569.604, "r_x1": 286.365, "r_y1": 569.604, "r_x2": 286.365, "r_y2": 561.052, "r_x3": 183.003, "r_y3": 561.052, "coord_origin": "TOPLEFT"}, "text": "documents is ubiquitous.", "orig": "documents is ubiquitous.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 50, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 581.559, "r_x1": 286.365, "r_y1": 581.559, "r_x2": 286.365, "r_y2": 573.0070000000001, "r_x3": 50.112, "r_y3": 573.0070000000001, "coord_origin": "TOPLEFT"}, "text": "They often summarise quantitative or factual data, which is", "orig": "They often summarise quantitative or factual data, which is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 51, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 593.514, "r_x1": 286.365, "r_y1": 593.514, "r_x2": 286.365, "r_y2": 584.962, "r_x3": 50.112, "r_y3": 584.962, "coord_origin": "TOPLEFT"}, "text": "cumbersome to describe in verbose text but nevertheless ex-", "orig": "cumbersome to describe in verbose text but nevertheless ex-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 52, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 605.47, "r_x1": 119.95, "r_y1": 605.47, "r_x2": 119.95, "r_y2": 596.918, "r_x3": 50.112, "r_y3": 596.918, "coord_origin": "TOPLEFT"}, "text": "tremely valuable.", "orig": "tremely valuable.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 53, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 125.778, "r_y0": 605.47, "r_x1": 286.365, "r_y1": 605.47, "r_x2": 286.365, "r_y2": 596.918, "r_x3": 125.778, "r_y3": 596.918, "coord_origin": "TOPLEFT"}, "text": "Unfortunately, this compact representa-", "orig": "Unfortunately, this compact representa-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 54, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 617.425, "r_x1": 286.365, "r_y1": 617.425, "r_x2": 286.365, "r_y2": 608.873, "r_x3": 50.112, "r_y3": 608.873, "coord_origin": "TOPLEFT"}, "text": "tion is often not easy to parse by machines. There are many", "orig": "tion is often not easy to parse by machines. There are many", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 55, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 629.38, "r_x1": 286.365, "r_y1": 629.38, "r_x2": 286.365, "r_y2": 620.828, "r_x3": 50.112, "r_y3": 620.828, "coord_origin": "TOPLEFT"}, "text": "implicit conventions used to obtain a compact table repre-", "orig": "implicit conventions used to obtain a compact table repre-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 56, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 641.335, "r_x1": 286.365, "r_y1": 641.335, "r_x2": 286.365, "r_y2": 632.783, "r_x3": 50.112, "r_y3": 632.783, "coord_origin": "TOPLEFT"}, "text": "sentation. For example, tables often have complex column-", "orig": "sentation. For example, tables often have complex column-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 57, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 653.29, "r_x1": 286.365, "r_y1": 653.29, "r_x2": 286.365, "r_y2": 644.738, "r_x3": 50.112, "r_y3": 644.738, "coord_origin": "TOPLEFT"}, "text": "and row-headers in order to reduce duplicated cell content.", "orig": "and row-headers in order to reduce duplicated cell content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 58, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 665.245, "r_x1": 286.365, "r_y1": 665.245, "r_x2": 286.365, "r_y2": 656.693, "r_x3": 50.112, "r_y3": 656.693, "coord_origin": "TOPLEFT"}, "text": "Lines of different shapes and sizes are leveraged to separate", "orig": "Lines of different shapes and sizes are leveraged to separate", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 59, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 677.201, "r_x1": 286.365, "r_y1": 677.201, "r_x2": 286.365, "r_y2": 668.649, "r_x3": 50.112, "r_y3": 668.649, "coord_origin": "TOPLEFT"}, "text": "content or indicate a tree structure. Additionally, tables can", "orig": "content or indicate a tree structure. Additionally, tables can", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 60, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 689.156, "r_x1": 286.365, "r_y1": 689.156, "r_x2": 286.365, "r_y2": 680.604, "r_x3": 50.112, "r_y3": 680.604, "coord_origin": "TOPLEFT"}, "text": "also have empty/missing table-entries or multi-row textual", "orig": "also have empty/missing table-entries or multi-row textual", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 61, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 701.111, "r_x1": 101.848, "r_y1": 701.111, "r_x2": 101.848, "r_y2": 692.559, "r_x3": 50.112, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "table-entries.", "orig": "table-entries.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 62, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 106.261, "r_y0": 701.111, "r_x1": 286.365, "r_y1": 701.111, "r_x2": 286.365, "r_y2": 692.559, "r_x3": 106.261, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "Fig. 1 shows a table which presents all these", "orig": "Fig. 1 shows a table which presents all these", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 63, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 713.066, "r_x1": 76.403, "r_y1": 713.066, "r_x2": 76.403, "r_y2": 704.514, "r_x3": 50.112, "r_y3": 704.514, "coord_origin": "TOPLEFT"}, "text": "issues.", "orig": "issues.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "The occurrence of tables in documents is ubiquitous. They often summarise quantitative or factual data, which is cumbersome to describe in verbose text but nevertheless extremely valuable. Unfortunately, this compact representation is often not easy to parse by machines. There are many implicit conventions used to obtain a compact table representation. For example, tables often have complex columnand row-headers in order to reduce duplicated cell content. Lines of different shapes and sizes are leveraged to separate content or indicate a tree structure. Additionally, tables can also have empty/missing table-entries or multi-row textual table-entries. Fig. 1 shows a table which presents all these issues."}, {"label": "section_header", "id": 14, "page_no": 0, "cluster": {"id": 14, "label": "section_header", "bbox": {"l": 315.567, "t": 218.34900000000005, "r": 408.441, "b": 226.66200000000003, "coord_origin": "TOPLEFT"}, "confidence": 0.6724023818969727, "cells": [{"index": 64, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 315.567, "r_y0": 226.66200000000003, "r_x1": 408.441, "r_y1": 226.66200000000003, "r_x2": 408.441, "r_y2": 218.34900000000005, "r_x3": 315.567, "r_y3": 218.34900000000005, "coord_origin": "TOPLEFT"}, "text": "a. Picture of a table:", "orig": "a. Picture of a table:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "a. Picture of a table:"}, {"label": "list_item", "id": 17, "page_no": 0, "cluster": {"id": 17, "label": "list_item", "bbox": {"l": 315.567, "t": 314.037, "r": 486.402, "b": 333.15, "coord_origin": "TOPLEFT"}, "confidence": 0.5549328923225403, "cells": [{"index": 65, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 315.567, "r_y0": 322.35, "r_x1": 486.402, "r_y1": 322.35, "r_x2": 486.402, "r_y2": 314.037, "r_x3": 315.567, "r_y3": 314.037, "coord_origin": "TOPLEFT"}, "text": "b. Red-annotation of bounding boxes,", "orig": "b. Red-annotation of bounding boxes,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 66, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 326.463, "r_y0": 333.15, "r_x1": 472.474, "r_y1": 333.15, "r_x2": 472.474, "r_y2": 324.837, "r_x3": 326.463, "r_y3": 324.837, "coord_origin": "TOPLEFT"}, "text": "Blue-predictions by TableFormer", "orig": "Blue-predictions by TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "b. Red-annotation of bounding boxes, Blue-predictions by TableFormer"}, {"label": "list_item", "id": 18, "page_no": 0, "cluster": {"id": 18, "label": "list_item", "bbox": {"l": 315.567, "t": 420.525, "r": 491.191, "b": 428.838, "coord_origin": "TOPLEFT"}, "confidence": 0.5501358509063721, "cells": [{"index": 67, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 315.567, "r_y0": 428.838, "r_x1": 491.191, "r_y1": 428.838, "r_x2": 491.191, "r_y2": 420.525, "r_x3": 315.567, "r_y3": 420.525, "coord_origin": "TOPLEFT"}, "text": "c. Structure predicted by TableFormer:", "orig": "c. Structure predicted by TableFormer:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "c. Structure predicted by TableFormer:"}, {"label": "picture", "id": 10, "page_no": 0, "cluster": {"id": 10, "label": "picture", "bbox": {"l": 314.78173828125, "t": 338.0652770996094, "r": 539.1802978515625, "b": 410.0494384765625, "coord_origin": "TOPLEFT"}, "confidence": 0.8742761611938477, "cells": [{"index": 68, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 408.148, "r_y0": 351.356, "r_x1": 412.54, "r_y1": 351.356, "r_x2": 412.54, "r_y2": 343.601, "r_x3": 408.148, "r_y3": 343.601, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 69, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 356.11, "r_y0": 350.099, "r_x1": 360.503, "r_y1": 350.099, "r_x2": 360.503, "r_y2": 342.345, "r_x3": 356.11, "r_y3": 342.345, "coord_origin": "TOPLEFT"}, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 70, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 500.678, "r_y0": 349.465, "r_x1": 505.07, "r_y1": 349.465, "r_x2": 505.07, "r_y2": 341.711, "r_x3": 500.678, "r_y3": 341.711, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 71, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 356.134, "r_y0": 360.275, "r_x1": 360.526, "r_y1": 360.275, "r_x2": 360.526, "r_y2": 352.521, "r_x3": 356.134, "r_y3": 352.521, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 72, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 402.54, "r_y0": 364.404, "r_x1": 406.932, "r_y1": 364.404, "r_x2": 406.932, "r_y2": 356.65, "r_x3": 402.54, "r_y3": 356.65, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 73, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 448.582, "r_y0": 361.367, "r_x1": 452.974, "r_y1": 361.367, "r_x2": 452.974, "r_y2": 353.613, "r_x3": 448.582, "r_y3": 353.613, "coord_origin": "TOPLEFT"}, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 74, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 491.652, "r_y0": 362.234, "r_x1": 496.044, "r_y1": 362.234, "r_x2": 496.044, "r_y2": 354.48, "r_x3": 491.652, "r_y3": 354.48, "coord_origin": "TOPLEFT"}, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 75, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 535.138, "r_y0": 361.867, "r_x1": 539.531, "r_y1": 361.867, "r_x2": 539.531, "r_y2": 354.113, "r_x3": 535.138, "r_y3": 354.113, "coord_origin": "TOPLEFT"}, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 76, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 348.828, "r_y0": 395.625, "r_x1": 353.221, "r_y1": 395.625, "r_x2": 353.221, "r_y2": 387.871, "r_x3": 348.828, "r_y3": 387.871, "coord_origin": "TOPLEFT"}, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 77, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 389.272, "r_y0": 383.9, "r_x1": 393.664, "r_y1": 383.9, "r_x2": 393.664, "r_y2": 376.145, "r_x3": 389.272, "r_y3": 376.145, "coord_origin": "TOPLEFT"}, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 78, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 442.675, "r_y0": 384.173, "r_x1": 451.459, "r_y1": 384.173, "r_x2": 451.459, "r_y2": 376.419, "r_x3": 442.675, "r_y3": 376.419, "coord_origin": "TOPLEFT"}, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 79, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 477.438, "r_y0": 384.061, "r_x1": 485.902, "r_y1": 384.061, "r_x2": 485.902, "r_y2": 376.307, "r_x3": 477.438, "r_y3": 376.307, "coord_origin": "TOPLEFT"}, "text": "11", "orig": "11", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 80, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 522.573, "r_y0": 384.173, "r_x1": 531.357, "r_y1": 384.173, "r_x2": 531.357, "r_y2": 376.419, "r_x3": 522.573, "r_y3": 376.419, "coord_origin": "TOPLEFT"}, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 81, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 400.23, "r_y0": 395.642, "r_x1": 409.014, "r_y1": 395.642, "r_x2": 409.014, "r_y2": 387.887, "r_x3": 400.23, "r_y3": 387.887, "coord_origin": "TOPLEFT"}, "text": "13", "orig": "13", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 82, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 442.308, "r_y0": 395.517, "r_x1": 451.092, "r_y1": 395.517, "r_x2": 451.092, "r_y2": 387.763, "r_x3": 442.308, "r_y3": 387.763, "coord_origin": "TOPLEFT"}, "text": "14", "orig": "14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 83, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 478.219, "r_y0": 395.902, "r_x1": 487.003, "r_y1": 395.902, "r_x2": 487.003, "r_y2": 388.148, "r_x3": 478.219, "r_y3": 388.148, "coord_origin": "TOPLEFT"}, "text": "15", "orig": "15", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 84, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 523.229, "r_y0": 395.517, "r_x1": 532.013, "r_y1": 395.517, "r_x2": 532.013, "r_y2": 387.763, "r_x3": 523.229, "r_y3": 387.763, "coord_origin": "TOPLEFT"}, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 85, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 411.572, "r_y0": 407.952, "r_x1": 420.356, "r_y1": 407.952, "r_x2": 420.356, "r_y2": 400.198, "r_x3": 411.572, "r_y3": 400.198, "coord_origin": "TOPLEFT"}, "text": "17", "orig": "17", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 86, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 442.305, "r_y0": 407.564, "r_x1": 451.089, "r_y1": 407.564, "r_x2": 451.089, "r_y2": 399.81, "r_x3": 442.305, "r_y3": 399.81, "coord_origin": "TOPLEFT"}, "text": "18", "orig": "18", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 87, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 478.779, "r_y0": 407.524, "r_x1": 487.563, "r_y1": 407.524, "r_x2": 487.563, "r_y2": 399.769, "r_x3": 478.779, "r_y3": 399.769, "coord_origin": "TOPLEFT"}, "text": "19", "orig": "19", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 88, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 523.972, "r_y0": 407.139, "r_x1": 532.756, "r_y1": 407.139, "r_x2": 532.756, "r_y2": 399.385, "r_x3": 523.972, "r_y3": 399.385, "coord_origin": "TOPLEFT"}, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 111, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 385.094, "r_y0": 367.853, "r_x1": 391.099, "r_y1": 367.853, "r_x2": 391.099, "r_y2": 357.89, "r_x3": 385.094, "r_y3": 357.89, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 114, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 333.435, "r_y0": 390.82, "r_x1": 339.439, "r_y1": 390.82, "r_x2": 339.439, "r_y2": 380.856, "r_x3": 333.435, "r_y3": 380.856, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 116, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 478.072, "r_y0": 351.13, "r_x1": 484.077, "r_y1": 351.13, "r_x2": 484.077, "r_y2": 341.166, "r_x3": 478.072, "r_y3": 341.166, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": [{"id": 40, "label": "text", "bbox": {"l": 408.148, "t": 343.601, "r": 412.54, "b": 351.356, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 68, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 408.148, "r_y0": 351.356, "r_x1": 412.54, "r_y1": 351.356, "r_x2": 412.54, "r_y2": 343.601, "r_x3": 408.148, "r_y3": 343.601, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 41, "label": "text", "bbox": {"l": 356.11, "t": 342.345, "r": 360.503, "b": 350.099, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 69, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 356.11, "r_y0": 350.099, "r_x1": 360.503, "r_y1": 350.099, "r_x2": 360.503, "r_y2": 342.345, "r_x3": 356.11, "r_y3": 342.345, "coord_origin": "TOPLEFT"}, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 42, "label": "text", "bbox": {"l": 500.678, "t": 341.711, "r": 505.07, "b": 349.465, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 70, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 500.678, "r_y0": 349.465, "r_x1": 505.07, "r_y1": 349.465, "r_x2": 505.07, "r_y2": 341.711, "r_x3": 500.678, "r_y3": 341.711, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 43, "label": "text", "bbox": {"l": 356.134, "t": 352.521, "r": 360.526, "b": 360.275, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 71, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 356.134, "r_y0": 360.275, "r_x1": 360.526, "r_y1": 360.275, "r_x2": 360.526, "r_y2": 352.521, "r_x3": 356.134, "r_y3": 352.521, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 44, "label": "text", "bbox": {"l": 402.54, "t": 356.65, "r": 406.932, "b": 364.404, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 72, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 402.54, "r_y0": 364.404, "r_x1": 406.932, "r_y1": 364.404, "r_x2": 406.932, "r_y2": 356.65, "r_x3": 402.54, "r_y3": 356.65, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 45, "label": "text", "bbox": {"l": 448.582, "t": 353.613, "r": 452.974, "b": 361.367, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 73, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 448.582, "r_y0": 361.367, "r_x1": 452.974, "r_y1": 361.367, "r_x2": 452.974, "r_y2": 353.613, "r_x3": 448.582, "r_y3": 353.613, "coord_origin": "TOPLEFT"}, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 46, "label": "text", "bbox": {"l": 491.652, "t": 354.48, "r": 496.044, "b": 362.234, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 74, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 491.652, "r_y0": 362.234, "r_x1": 496.044, "r_y1": 362.234, "r_x2": 496.044, "r_y2": 354.48, "r_x3": 491.652, "r_y3": 354.48, "coord_origin": "TOPLEFT"}, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 47, "label": "text", "bbox": {"l": 535.138, "t": 354.113, "r": 539.531, "b": 361.867, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 75, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 535.138, "r_y0": 361.867, "r_x1": 539.531, "r_y1": 361.867, "r_x2": 539.531, "r_y2": 354.113, "r_x3": 535.138, "r_y3": 354.113, "coord_origin": "TOPLEFT"}, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 48, "label": "text", "bbox": {"l": 348.828, "t": 387.871, "r": 353.221, "b": 395.625, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 76, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 348.828, "r_y0": 395.625, "r_x1": 353.221, "r_y1": 395.625, "r_x2": 353.221, "r_y2": 387.871, "r_x3": 348.828, "r_y3": 387.871, "coord_origin": "TOPLEFT"}, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 49, "label": "text", "bbox": {"l": 389.272, "t": 376.145, "r": 393.664, "b": 383.9, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 77, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 389.272, "r_y0": 383.9, "r_x1": 393.664, "r_y1": 383.9, "r_x2": 393.664, "r_y2": 376.145, "r_x3": 389.272, "r_y3": 376.145, "coord_origin": "TOPLEFT"}, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 50, "label": "text", "bbox": {"l": 442.675, "t": 376.419, "r": 451.459, "b": 384.173, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 78, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 442.675, "r_y0": 384.173, "r_x1": 451.459, "r_y1": 384.173, "r_x2": 451.459, "r_y2": 376.419, "r_x3": 442.675, "r_y3": 376.419, "coord_origin": "TOPLEFT"}, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 51, "label": "text", "bbox": {"l": 477.438, "t": 376.307, "r": 485.902, "b": 384.061, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 79, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 477.438, "r_y0": 384.061, "r_x1": 485.902, "r_y1": 384.061, "r_x2": 485.902, "r_y2": 376.307, "r_x3": 477.438, "r_y3": 376.307, "coord_origin": "TOPLEFT"}, "text": "11", "orig": "11", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 52, "label": "text", "bbox": {"l": 522.573, "t": 376.419, "r": 531.357, "b": 384.173, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 80, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 522.573, "r_y0": 384.173, "r_x1": 531.357, "r_y1": 384.173, "r_x2": 531.357, "r_y2": 376.419, "r_x3": 522.573, "r_y3": 376.419, "coord_origin": "TOPLEFT"}, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 53, "label": "text", "bbox": {"l": 400.23, "t": 387.887, "r": 409.014, "b": 395.642, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 81, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 400.23, "r_y0": 395.642, "r_x1": 409.014, "r_y1": 395.642, "r_x2": 409.014, "r_y2": 387.887, "r_x3": 400.23, "r_y3": 387.887, "coord_origin": "TOPLEFT"}, "text": "13", "orig": "13", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 54, "label": "text", "bbox": {"l": 442.308, "t": 387.763, "r": 451.092, "b": 395.517, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 82, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 442.308, "r_y0": 395.517, "r_x1": 451.092, "r_y1": 395.517, "r_x2": 451.092, "r_y2": 387.763, "r_x3": 442.308, "r_y3": 387.763, "coord_origin": "TOPLEFT"}, "text": "14", "orig": "14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 55, "label": "text", "bbox": {"l": 478.219, "t": 388.148, "r": 487.003, "b": 395.902, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 83, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 478.219, "r_y0": 395.902, "r_x1": 487.003, "r_y1": 395.902, "r_x2": 487.003, "r_y2": 388.148, "r_x3": 478.219, "r_y3": 388.148, "coord_origin": "TOPLEFT"}, "text": "15", "orig": "15", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 56, "label": "text", "bbox": {"l": 523.229, "t": 387.763, "r": 532.013, "b": 395.517, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 84, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 523.229, "r_y0": 395.517, "r_x1": 532.013, "r_y1": 395.517, "r_x2": 532.013, "r_y2": 387.763, "r_x3": 523.229, "r_y3": 387.763, "coord_origin": "TOPLEFT"}, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 57, "label": "text", "bbox": {"l": 411.572, "t": 400.198, "r": 420.356, "b": 407.952, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 85, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 411.572, "r_y0": 407.952, "r_x1": 420.356, "r_y1": 407.952, "r_x2": 420.356, "r_y2": 400.198, "r_x3": 411.572, "r_y3": 400.198, "coord_origin": "TOPLEFT"}, "text": "17", "orig": "17", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 58, "label": "text", "bbox": {"l": 442.305, "t": 399.81, "r": 451.089, "b": 407.564, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 86, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 442.305, "r_y0": 407.564, "r_x1": 451.089, "r_y1": 407.564, "r_x2": 451.089, "r_y2": 399.81, "r_x3": 442.305, "r_y3": 399.81, "coord_origin": "TOPLEFT"}, "text": "18", "orig": "18", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 59, "label": "text", "bbox": {"l": 478.779, "t": 399.769, "r": 487.563, "b": 407.524, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 87, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 478.779, "r_y0": 407.524, "r_x1": 487.563, "r_y1": 407.524, "r_x2": 487.563, "r_y2": 399.769, "r_x3": 478.779, "r_y3": 399.769, "coord_origin": "TOPLEFT"}, "text": "19", "orig": "19", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 60, "label": "text", "bbox": {"l": 523.972, "t": 399.385, "r": 532.756, "b": 407.139, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 88, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 523.972, "r_y0": 407.139, "r_x1": 532.756, "r_y1": 407.139, "r_x2": 532.756, "r_y2": 399.385, "r_x3": 523.972, "r_y3": 399.385, "coord_origin": "TOPLEFT"}, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 83, "label": "text", "bbox": {"l": 385.094, "t": 357.89, "r": 391.099, "b": 367.853, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 111, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 385.094, "r_y0": 367.853, "r_x1": 391.099, "r_y1": 367.853, "r_x2": 391.099, "r_y2": 357.89, "r_x3": 385.094, "r_y3": 357.89, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 86, "label": "text", "bbox": {"l": 333.435, "t": 380.856, "r": 339.439, "b": 390.82, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 114, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 333.435, "r_y0": 390.82, "r_x1": 339.439, "r_y1": 390.82, "r_x2": 339.439, "r_y2": 380.856, "r_x3": 333.435, "r_y3": 380.856, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 88, "label": "text", "bbox": {"l": 478.072, "t": 341.166, "r": 484.077, "b": 351.13, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 116, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 478.072, "r_y0": 351.13, "r_x1": 484.077, "r_y1": 351.13, "r_x2": 484.077, "r_y2": 341.166, "r_x3": 478.072, "r_y3": 341.166, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}]}, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null}, {"label": "picture", "id": 23, "page_no": 0, "cluster": {"id": 23, "label": "picture", "bbox": {"l": 315.7172546386719, "t": 433.823486328125, "r": 536.835693359375, "b": 496.0290222167969, "coord_origin": "TOPLEFT"}, "confidence": 0.5088632702827454, "cells": [{"index": 89, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 347.249, "r_y0": 446.213, "r_x1": 351.641, "r_y1": 446.213, "r_x2": 351.641, "r_y2": 438.459, "r_x3": 347.249, "r_y3": 438.459, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 90, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 318.881, "r_y0": 446.213, "r_x1": 323.273, "r_y1": 446.213, "r_x2": 323.273, "r_y2": 438.459, "r_x3": 318.881, "r_y3": 438.459, "coord_origin": "TOPLEFT"}, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 91, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.104, "r_y0": 446.213, "r_x1": 398.497, "r_y1": 446.213, "r_x2": 398.497, "r_y2": 438.459, "r_x3": 394.104, "r_y3": 438.459, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 92, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 318.773, "r_y0": 458.073, "r_x1": 323.166, "r_y1": 458.073, "r_x2": 323.166, "r_y2": 450.319, "r_x3": 318.773, "r_y3": 450.319, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 93, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 347.249, "r_y0": 458.073, "r_x1": 351.641, "r_y1": 458.073, "r_x2": 351.641, "r_y2": 450.319, "r_x3": 347.249, "r_y3": 450.319, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 94, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.104, "r_y0": 458.073, "r_x1": 398.497, "r_y1": 458.073, "r_x2": 398.497, "r_y2": 450.319, "r_x3": 394.104, "r_y3": 450.319, "coord_origin": "TOPLEFT"}, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 95, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 440.959, "r_y0": 458.073, "r_x1": 445.352, "r_y1": 458.073, "r_x2": 445.352, "r_y2": 450.319, "r_x3": 440.959, "r_y3": 450.319, "coord_origin": "TOPLEFT"}, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 96, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 487.815, "r_y0": 458.073, "r_x1": 492.207, "r_y1": 458.073, "r_x2": 492.207, "r_y2": 450.319, "r_x3": 487.815, "r_y3": 450.319, "coord_origin": "TOPLEFT"}, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 97, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 318.773, "r_y0": 482.232, "r_x1": 323.166, "r_y1": 482.232, "r_x2": 323.166, "r_y2": 474.477, "r_x3": 318.773, "r_y3": 474.477, "coord_origin": "TOPLEFT"}, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 98, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 347.249, "r_y0": 470.372, "r_x1": 351.641, "r_y1": 470.372, "r_x2": 351.641, "r_y2": 462.618, "r_x3": 347.249, "r_y3": 462.618, "coord_origin": "TOPLEFT"}, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 99, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.104, "r_y0": 470.372, "r_x1": 402.888, "r_y1": 470.372, "r_x2": 402.888, "r_y2": 462.618, "r_x3": 394.104, "r_y3": 462.618, "coord_origin": "TOPLEFT"}, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 100, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 440.959, "r_y0": 470.372, "r_x1": 449.423, "r_y1": 470.372, "r_x2": 449.423, "r_y2": 462.618, "r_x3": 440.959, "r_y3": 462.618, "coord_origin": "TOPLEFT"}, "text": "11", "orig": "11", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 101, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 487.815, "r_y0": 470.372, "r_x1": 496.599, "r_y1": 470.372, "r_x2": 496.599, "r_y2": 462.618, "r_x3": 487.815, "r_y3": 462.618, "coord_origin": "TOPLEFT"}, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 102, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 347.249, "r_y0": 482.232, "r_x1": 356.033, "r_y1": 482.232, "r_x2": 356.033, "r_y2": 474.477, "r_x3": 347.249, "r_y3": 474.477, "coord_origin": "TOPLEFT"}, "text": "13", "orig": "13", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 103, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.104, "r_y0": 482.232, "r_x1": 402.888, "r_y1": 482.232, "r_x2": 402.888, "r_y2": 474.477, "r_x3": 394.104, "r_y3": 474.477, "coord_origin": "TOPLEFT"}, "text": "14", "orig": "14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 104, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 440.959, "r_y0": 482.232, "r_x1": 449.743, "r_y1": 482.232, "r_x2": 449.743, "r_y2": 474.477, "r_x3": 440.959, "r_y3": 474.477, "coord_origin": "TOPLEFT"}, "text": "15", "orig": "15", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 105, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 487.815, "r_y0": 482.232, "r_x1": 496.599, "r_y1": 482.232, "r_x2": 496.599, "r_y2": 474.477, "r_x3": 487.815, "r_y3": 474.477, "coord_origin": "TOPLEFT"}, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 106, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 347.249, "r_y0": 493.652, "r_x1": 356.033, "r_y1": 493.652, "r_x2": 356.033, "r_y2": 485.898, "r_x3": 347.249, "r_y3": 485.898, "coord_origin": "TOPLEFT"}, "text": "17", "orig": "17", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 107, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.104, "r_y0": 493.652, "r_x1": 402.888, "r_y1": 493.652, "r_x2": 402.888, "r_y2": 485.898, "r_x3": 394.104, "r_y3": 485.898, "coord_origin": "TOPLEFT"}, "text": "18", "orig": "18", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 108, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 440.959, "r_y0": 493.652, "r_x1": 449.743, "r_y1": 493.652, "r_x2": 449.743, "r_y2": 485.898, "r_x3": 440.959, "r_y3": 485.898, "coord_origin": "TOPLEFT"}, "text": "19", "orig": "19", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 109, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 487.815, "r_y0": 493.652, "r_x1": 496.599, "r_y1": 493.652, "r_x2": 496.599, "r_y2": 485.898, "r_x3": 487.815, "r_y3": 485.898, "coord_origin": "TOPLEFT"}, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 112, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 366.701, "r_y0": 459.214, "r_x1": 372.706, "r_y1": 459.214, "r_x2": 372.706, "r_y2": 449.25, "r_x3": 366.701, "r_y3": 449.25, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 115, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 331.904, "r_y0": 483.416, "r_x1": 337.909, "r_y1": 483.416, "r_x2": 337.909, "r_y2": 473.452, "r_x3": 331.904, "r_y3": 473.452, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 117, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 459.876, "r_y0": 447.687, "r_x1": 465.881, "r_y1": 447.687, "r_x2": 465.881, "r_y2": 437.723, "r_x3": 459.876, "r_y3": 437.723, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": [{"id": 61, "label": "text", "bbox": {"l": 347.249, "t": 438.459, "r": 351.641, "b": 446.213, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 89, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 347.249, "r_y0": 446.213, "r_x1": 351.641, "r_y1": 446.213, "r_x2": 351.641, "r_y2": 438.459, "r_x3": 347.249, "r_y3": 438.459, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 62, "label": "text", "bbox": {"l": 318.881, "t": 438.459, "r": 323.273, "b": 446.213, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 90, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 318.881, "r_y0": 446.213, "r_x1": 323.273, "r_y1": 446.213, "r_x2": 323.273, "r_y2": 438.459, "r_x3": 318.881, "r_y3": 438.459, "coord_origin": "TOPLEFT"}, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 63, "label": "text", "bbox": {"l": 394.104, "t": 438.459, "r": 398.497, "b": 446.213, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 91, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.104, "r_y0": 446.213, "r_x1": 398.497, "r_y1": 446.213, "r_x2": 398.497, "r_y2": 438.459, "r_x3": 394.104, "r_y3": 438.459, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 64, "label": "text", "bbox": {"l": 318.773, "t": 450.319, "r": 323.166, "b": 458.073, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 92, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 318.773, "r_y0": 458.073, "r_x1": 323.166, "r_y1": 458.073, "r_x2": 323.166, "r_y2": 450.319, "r_x3": 318.773, "r_y3": 450.319, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 65, "label": "text", "bbox": {"l": 347.249, "t": 450.319, "r": 351.641, "b": 458.073, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 93, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 347.249, "r_y0": 458.073, "r_x1": 351.641, "r_y1": 458.073, "r_x2": 351.641, "r_y2": 450.319, "r_x3": 347.249, "r_y3": 450.319, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 66, "label": "text", "bbox": {"l": 394.104, "t": 450.319, "r": 398.497, "b": 458.073, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 94, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.104, "r_y0": 458.073, "r_x1": 398.497, "r_y1": 458.073, "r_x2": 398.497, "r_y2": 450.319, "r_x3": 394.104, "r_y3": 450.319, "coord_origin": "TOPLEFT"}, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 67, "label": "text", "bbox": {"l": 440.959, "t": 450.319, "r": 445.352, "b": 458.073, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 95, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 440.959, "r_y0": 458.073, "r_x1": 445.352, "r_y1": 458.073, "r_x2": 445.352, "r_y2": 450.319, "r_x3": 440.959, "r_y3": 450.319, "coord_origin": "TOPLEFT"}, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 68, "label": "text", "bbox": {"l": 487.815, "t": 450.319, "r": 492.207, "b": 458.073, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 96, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 487.815, "r_y0": 458.073, "r_x1": 492.207, "r_y1": 458.073, "r_x2": 492.207, "r_y2": 450.319, "r_x3": 487.815, "r_y3": 450.319, "coord_origin": "TOPLEFT"}, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 69, "label": "text", "bbox": {"l": 318.773, "t": 474.477, "r": 323.166, "b": 482.232, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 97, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 318.773, "r_y0": 482.232, "r_x1": 323.166, "r_y1": 482.232, "r_x2": 323.166, "r_y2": 474.477, "r_x3": 318.773, "r_y3": 474.477, "coord_origin": "TOPLEFT"}, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 70, "label": "text", "bbox": {"l": 347.249, "t": 462.618, "r": 351.641, "b": 470.372, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 98, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 347.249, "r_y0": 470.372, "r_x1": 351.641, "r_y1": 470.372, "r_x2": 351.641, "r_y2": 462.618, "r_x3": 347.249, "r_y3": 462.618, "coord_origin": "TOPLEFT"}, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 71, "label": "text", "bbox": {"l": 394.104, "t": 462.618, "r": 402.888, "b": 470.372, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 99, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.104, "r_y0": 470.372, "r_x1": 402.888, "r_y1": 470.372, "r_x2": 402.888, "r_y2": 462.618, "r_x3": 394.104, "r_y3": 462.618, "coord_origin": "TOPLEFT"}, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 72, "label": "text", "bbox": {"l": 440.959, "t": 462.618, "r": 449.423, "b": 470.372, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 100, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 440.959, "r_y0": 470.372, "r_x1": 449.423, "r_y1": 470.372, "r_x2": 449.423, "r_y2": 462.618, "r_x3": 440.959, "r_y3": 462.618, "coord_origin": "TOPLEFT"}, "text": "11", "orig": "11", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 73, "label": "text", "bbox": {"l": 487.815, "t": 462.618, "r": 496.599, "b": 470.372, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 101, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 487.815, "r_y0": 470.372, "r_x1": 496.599, "r_y1": 470.372, "r_x2": 496.599, "r_y2": 462.618, "r_x3": 487.815, "r_y3": 462.618, "coord_origin": "TOPLEFT"}, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 74, "label": "text", "bbox": {"l": 347.249, "t": 474.477, "r": 356.033, "b": 482.232, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 102, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 347.249, "r_y0": 482.232, "r_x1": 356.033, "r_y1": 482.232, "r_x2": 356.033, "r_y2": 474.477, "r_x3": 347.249, "r_y3": 474.477, "coord_origin": "TOPLEFT"}, "text": "13", "orig": "13", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 75, "label": "text", "bbox": {"l": 394.104, "t": 474.477, "r": 402.888, "b": 482.232, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 103, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.104, "r_y0": 482.232, "r_x1": 402.888, "r_y1": 482.232, "r_x2": 402.888, "r_y2": 474.477, "r_x3": 394.104, "r_y3": 474.477, "coord_origin": "TOPLEFT"}, "text": "14", "orig": "14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 76, "label": "text", "bbox": {"l": 440.959, "t": 474.477, "r": 449.743, "b": 482.232, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 104, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 440.959, "r_y0": 482.232, "r_x1": 449.743, "r_y1": 482.232, "r_x2": 449.743, "r_y2": 474.477, "r_x3": 440.959, "r_y3": 474.477, "coord_origin": "TOPLEFT"}, "text": "15", "orig": "15", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 77, "label": "text", "bbox": {"l": 487.815, "t": 474.477, "r": 496.599, "b": 482.232, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 105, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 487.815, "r_y0": 482.232, "r_x1": 496.599, "r_y1": 482.232, "r_x2": 496.599, "r_y2": 474.477, "r_x3": 487.815, "r_y3": 474.477, "coord_origin": "TOPLEFT"}, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 78, "label": "text", "bbox": {"l": 347.249, "t": 485.898, "r": 356.033, "b": 493.652, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 106, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 347.249, "r_y0": 493.652, "r_x1": 356.033, "r_y1": 493.652, "r_x2": 356.033, "r_y2": 485.898, "r_x3": 347.249, "r_y3": 485.898, "coord_origin": "TOPLEFT"}, "text": "17", "orig": "17", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 79, "label": "text", "bbox": {"l": 394.104, "t": 485.898, "r": 402.888, "b": 493.652, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 107, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.104, "r_y0": 493.652, "r_x1": 402.888, "r_y1": 493.652, "r_x2": 402.888, "r_y2": 485.898, "r_x3": 394.104, "r_y3": 485.898, "coord_origin": "TOPLEFT"}, "text": "18", "orig": "18", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 80, "label": "text", "bbox": {"l": 440.959, "t": 485.898, "r": 449.743, "b": 493.652, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 108, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 440.959, "r_y0": 493.652, "r_x1": 449.743, "r_y1": 493.652, "r_x2": 449.743, "r_y2": 485.898, "r_x3": 440.959, "r_y3": 485.898, "coord_origin": "TOPLEFT"}, "text": "19", "orig": "19", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 81, "label": "text", "bbox": {"l": 487.815, "t": 485.898, "r": 496.599, "b": 493.652, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 109, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 487.815, "r_y0": 493.652, "r_x1": 496.599, "r_y1": 493.652, "r_x2": 496.599, "r_y2": 485.898, "r_x3": 487.815, "r_y3": 485.898, "coord_origin": "TOPLEFT"}, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 84, "label": "text", "bbox": {"l": 366.701, "t": 449.25, "r": 372.706, "b": 459.214, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 112, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 366.701, "r_y0": 459.214, "r_x1": 372.706, "r_y1": 459.214, "r_x2": 372.706, "r_y2": 449.25, "r_x3": 366.701, "r_y3": 449.25, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 87, "label": "text", "bbox": {"l": 331.904, "t": 473.452, "r": 337.909, "b": 483.416, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 115, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 331.904, "r_y0": 483.416, "r_x1": 337.909, "r_y1": 483.416, "r_x2": 337.909, "r_y2": 473.452, "r_x3": 331.904, "r_y3": 473.452, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 89, "label": "text", "bbox": {"l": 459.876, "t": 437.723, "r": 465.881, "b": 447.687, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 117, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 459.876, "r_y0": 447.687, "r_x1": 465.881, "r_y1": 447.687, "r_x2": 465.881, "r_y2": 437.723, "r_x3": 459.876, "r_y3": 437.723, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}]}, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null}, {"label": "table", "id": 11, "page_no": 0, "cluster": {"id": 11, "label": "table", "bbox": {"l": 315.7172546386719, "t": 433.823486328125, "r": 536.835693359375, "b": 496.0290222167969, "coord_origin": "TOPLEFT"}, "confidence": 0.8056110739707947, "cells": [{"index": 89, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 347.249, "r_y0": 446.213, "r_x1": 351.641, "r_y1": 446.213, "r_x2": 351.641, "r_y2": 438.459, "r_x3": 347.249, "r_y3": 438.459, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 90, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 318.881, "r_y0": 446.213, "r_x1": 323.273, "r_y1": 446.213, "r_x2": 323.273, "r_y2": 438.459, "r_x3": 318.881, "r_y3": 438.459, "coord_origin": "TOPLEFT"}, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 91, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.104, "r_y0": 446.213, "r_x1": 398.497, "r_y1": 446.213, "r_x2": 398.497, "r_y2": 438.459, "r_x3": 394.104, "r_y3": 438.459, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 92, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 318.773, "r_y0": 458.073, "r_x1": 323.166, "r_y1": 458.073, "r_x2": 323.166, "r_y2": 450.319, "r_x3": 318.773, "r_y3": 450.319, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 93, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 347.249, "r_y0": 458.073, "r_x1": 351.641, "r_y1": 458.073, "r_x2": 351.641, "r_y2": 450.319, "r_x3": 347.249, "r_y3": 450.319, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 94, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.104, "r_y0": 458.073, "r_x1": 398.497, "r_y1": 458.073, "r_x2": 398.497, "r_y2": 450.319, "r_x3": 394.104, "r_y3": 450.319, "coord_origin": "TOPLEFT"}, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 95, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 440.959, "r_y0": 458.073, "r_x1": 445.352, "r_y1": 458.073, "r_x2": 445.352, "r_y2": 450.319, "r_x3": 440.959, "r_y3": 450.319, "coord_origin": "TOPLEFT"}, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 96, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 487.815, "r_y0": 458.073, "r_x1": 492.207, "r_y1": 458.073, "r_x2": 492.207, "r_y2": 450.319, "r_x3": 487.815, "r_y3": 450.319, "coord_origin": "TOPLEFT"}, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 97, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 318.773, "r_y0": 482.232, "r_x1": 323.166, "r_y1": 482.232, "r_x2": 323.166, "r_y2": 474.477, "r_x3": 318.773, "r_y3": 474.477, "coord_origin": "TOPLEFT"}, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 98, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 347.249, "r_y0": 470.372, "r_x1": 351.641, "r_y1": 470.372, "r_x2": 351.641, "r_y2": 462.618, "r_x3": 347.249, "r_y3": 462.618, "coord_origin": "TOPLEFT"}, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 99, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.104, "r_y0": 470.372, "r_x1": 402.888, "r_y1": 470.372, "r_x2": 402.888, "r_y2": 462.618, "r_x3": 394.104, "r_y3": 462.618, "coord_origin": "TOPLEFT"}, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 100, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 440.959, "r_y0": 470.372, "r_x1": 449.423, "r_y1": 470.372, "r_x2": 449.423, "r_y2": 462.618, "r_x3": 440.959, "r_y3": 462.618, "coord_origin": "TOPLEFT"}, "text": "11", "orig": "11", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 101, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 487.815, "r_y0": 470.372, "r_x1": 496.599, "r_y1": 470.372, "r_x2": 496.599, "r_y2": 462.618, "r_x3": 487.815, "r_y3": 462.618, "coord_origin": "TOPLEFT"}, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 102, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 347.249, "r_y0": 482.232, "r_x1": 356.033, "r_y1": 482.232, "r_x2": 356.033, "r_y2": 474.477, "r_x3": 347.249, "r_y3": 474.477, "coord_origin": "TOPLEFT"}, "text": "13", "orig": "13", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 103, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.104, "r_y0": 482.232, "r_x1": 402.888, "r_y1": 482.232, "r_x2": 402.888, "r_y2": 474.477, "r_x3": 394.104, "r_y3": 474.477, "coord_origin": "TOPLEFT"}, "text": "14", "orig": "14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 104, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 440.959, "r_y0": 482.232, "r_x1": 449.743, "r_y1": 482.232, "r_x2": 449.743, "r_y2": 474.477, "r_x3": 440.959, "r_y3": 474.477, "coord_origin": "TOPLEFT"}, "text": "15", "orig": "15", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 105, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 487.815, "r_y0": 482.232, "r_x1": 496.599, "r_y1": 482.232, "r_x2": 496.599, "r_y2": 474.477, "r_x3": 487.815, "r_y3": 474.477, "coord_origin": "TOPLEFT"}, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 106, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 347.249, "r_y0": 493.652, "r_x1": 356.033, "r_y1": 493.652, "r_x2": 356.033, "r_y2": 485.898, "r_x3": 347.249, "r_y3": 485.898, "coord_origin": "TOPLEFT"}, "text": "17", "orig": "17", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 107, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.104, "r_y0": 493.652, "r_x1": 402.888, "r_y1": 493.652, "r_x2": 402.888, "r_y2": 485.898, "r_x3": 394.104, "r_y3": 485.898, "coord_origin": "TOPLEFT"}, "text": "18", "orig": "18", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 108, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 440.959, "r_y0": 493.652, "r_x1": 449.743, "r_y1": 493.652, "r_x2": 449.743, "r_y2": 485.898, "r_x3": 440.959, "r_y3": 485.898, "coord_origin": "TOPLEFT"}, "text": "19", "orig": "19", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 109, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 487.815, "r_y0": 493.652, "r_x1": 496.599, "r_y1": 493.652, "r_x2": 496.599, "r_y2": 485.898, "r_x3": 487.815, "r_y3": 485.898, "coord_origin": "TOPLEFT"}, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 112, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 366.701, "r_y0": 459.214, "r_x1": 372.706, "r_y1": 459.214, "r_x2": 372.706, "r_y2": 449.25, "r_x3": 366.701, "r_y3": 449.25, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 115, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 331.904, "r_y0": 483.416, "r_x1": 337.909, "r_y1": 483.416, "r_x2": 337.909, "r_y2": 473.452, "r_x3": 331.904, "r_y3": 473.452, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 117, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 459.876, "r_y0": 447.687, "r_x1": 465.881, "r_y1": 447.687, "r_x2": 465.881, "r_y2": 437.723, "r_x3": 459.876, "r_y3": 437.723, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": [{"id": 61, "label": "text", "bbox": {"l": 347.249, "t": 438.459, "r": 351.641, "b": 446.213, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 89, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 347.249, "r_y0": 446.213, "r_x1": 351.641, "r_y1": 446.213, "r_x2": 351.641, "r_y2": 438.459, "r_x3": 347.249, "r_y3": 438.459, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 62, "label": "text", "bbox": {"l": 318.881, "t": 438.459, "r": 323.273, "b": 446.213, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 90, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 318.881, "r_y0": 446.213, "r_x1": 323.273, "r_y1": 446.213, "r_x2": 323.273, "r_y2": 438.459, "r_x3": 318.881, "r_y3": 438.459, "coord_origin": "TOPLEFT"}, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 63, "label": "text", "bbox": {"l": 394.104, "t": 438.459, "r": 398.497, "b": 446.213, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 91, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.104, "r_y0": 446.213, "r_x1": 398.497, "r_y1": 446.213, "r_x2": 398.497, "r_y2": 438.459, "r_x3": 394.104, "r_y3": 438.459, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 64, "label": "text", "bbox": {"l": 318.773, "t": 450.319, "r": 323.166, "b": 458.073, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 92, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 318.773, "r_y0": 458.073, "r_x1": 323.166, "r_y1": 458.073, "r_x2": 323.166, "r_y2": 450.319, "r_x3": 318.773, "r_y3": 450.319, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 65, "label": "text", "bbox": {"l": 347.249, "t": 450.319, "r": 351.641, "b": 458.073, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 93, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 347.249, "r_y0": 458.073, "r_x1": 351.641, "r_y1": 458.073, "r_x2": 351.641, "r_y2": 450.319, "r_x3": 347.249, "r_y3": 450.319, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 66, "label": "text", "bbox": {"l": 394.104, "t": 450.319, "r": 398.497, "b": 458.073, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 94, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.104, "r_y0": 458.073, "r_x1": 398.497, "r_y1": 458.073, "r_x2": 398.497, "r_y2": 450.319, "r_x3": 394.104, "r_y3": 450.319, "coord_origin": "TOPLEFT"}, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 67, "label": "text", "bbox": {"l": 440.959, "t": 450.319, "r": 445.352, "b": 458.073, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 95, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 440.959, "r_y0": 458.073, "r_x1": 445.352, "r_y1": 458.073, "r_x2": 445.352, "r_y2": 450.319, "r_x3": 440.959, "r_y3": 450.319, "coord_origin": "TOPLEFT"}, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 68, "label": "text", "bbox": {"l": 487.815, "t": 450.319, "r": 492.207, "b": 458.073, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 96, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 487.815, "r_y0": 458.073, "r_x1": 492.207, "r_y1": 458.073, "r_x2": 492.207, "r_y2": 450.319, "r_x3": 487.815, "r_y3": 450.319, "coord_origin": "TOPLEFT"}, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 69, "label": "text", "bbox": {"l": 318.773, "t": 474.477, "r": 323.166, "b": 482.232, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 97, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 318.773, "r_y0": 482.232, "r_x1": 323.166, "r_y1": 482.232, "r_x2": 323.166, "r_y2": 474.477, "r_x3": 318.773, "r_y3": 474.477, "coord_origin": "TOPLEFT"}, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 70, "label": "text", "bbox": {"l": 347.249, "t": 462.618, "r": 351.641, "b": 470.372, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 98, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 347.249, "r_y0": 470.372, "r_x1": 351.641, "r_y1": 470.372, "r_x2": 351.641, "r_y2": 462.618, "r_x3": 347.249, "r_y3": 462.618, "coord_origin": "TOPLEFT"}, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 71, "label": "text", "bbox": {"l": 394.104, "t": 462.618, "r": 402.888, "b": 470.372, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 99, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.104, "r_y0": 470.372, "r_x1": 402.888, "r_y1": 470.372, "r_x2": 402.888, "r_y2": 462.618, "r_x3": 394.104, "r_y3": 462.618, "coord_origin": "TOPLEFT"}, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 72, "label": "text", "bbox": {"l": 440.959, "t": 462.618, "r": 449.423, "b": 470.372, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 100, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 440.959, "r_y0": 470.372, "r_x1": 449.423, "r_y1": 470.372, "r_x2": 449.423, "r_y2": 462.618, "r_x3": 440.959, "r_y3": 462.618, "coord_origin": "TOPLEFT"}, "text": "11", "orig": "11", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 73, "label": "text", "bbox": {"l": 487.815, "t": 462.618, "r": 496.599, "b": 470.372, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 101, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 487.815, "r_y0": 470.372, "r_x1": 496.599, "r_y1": 470.372, "r_x2": 496.599, "r_y2": 462.618, "r_x3": 487.815, "r_y3": 462.618, "coord_origin": "TOPLEFT"}, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 74, "label": "text", "bbox": {"l": 347.249, "t": 474.477, "r": 356.033, "b": 482.232, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 102, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 347.249, "r_y0": 482.232, "r_x1": 356.033, "r_y1": 482.232, "r_x2": 356.033, "r_y2": 474.477, "r_x3": 347.249, "r_y3": 474.477, "coord_origin": "TOPLEFT"}, "text": "13", "orig": "13", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 75, "label": "text", "bbox": {"l": 394.104, "t": 474.477, "r": 402.888, "b": 482.232, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 103, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.104, "r_y0": 482.232, "r_x1": 402.888, "r_y1": 482.232, "r_x2": 402.888, "r_y2": 474.477, "r_x3": 394.104, "r_y3": 474.477, "coord_origin": "TOPLEFT"}, "text": "14", "orig": "14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 76, "label": "text", "bbox": {"l": 440.959, "t": 474.477, "r": 449.743, "b": 482.232, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 104, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 440.959, "r_y0": 482.232, "r_x1": 449.743, "r_y1": 482.232, "r_x2": 449.743, "r_y2": 474.477, "r_x3": 440.959, "r_y3": 474.477, "coord_origin": "TOPLEFT"}, "text": "15", "orig": "15", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 77, "label": "text", "bbox": {"l": 487.815, "t": 474.477, "r": 496.599, "b": 482.232, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 105, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 487.815, "r_y0": 482.232, "r_x1": 496.599, "r_y1": 482.232, "r_x2": 496.599, "r_y2": 474.477, "r_x3": 487.815, "r_y3": 474.477, "coord_origin": "TOPLEFT"}, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 78, "label": "text", "bbox": {"l": 347.249, "t": 485.898, "r": 356.033, "b": 493.652, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 106, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 347.249, "r_y0": 493.652, "r_x1": 356.033, "r_y1": 493.652, "r_x2": 356.033, "r_y2": 485.898, "r_x3": 347.249, "r_y3": 485.898, "coord_origin": "TOPLEFT"}, "text": "17", "orig": "17", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 79, "label": "text", "bbox": {"l": 394.104, "t": 485.898, "r": 402.888, "b": 493.652, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 107, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.104, "r_y0": 493.652, "r_x1": 402.888, "r_y1": 493.652, "r_x2": 402.888, "r_y2": 485.898, "r_x3": 394.104, "r_y3": 485.898, "coord_origin": "TOPLEFT"}, "text": "18", "orig": "18", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 80, "label": "text", "bbox": {"l": 440.959, "t": 485.898, "r": 449.743, "b": 493.652, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 108, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 440.959, "r_y0": 493.652, "r_x1": 449.743, "r_y1": 493.652, "r_x2": 449.743, "r_y2": 485.898, "r_x3": 440.959, "r_y3": 485.898, "coord_origin": "TOPLEFT"}, "text": "19", "orig": "19", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 81, "label": "text", "bbox": {"l": 487.815, "t": 485.898, "r": 496.599, "b": 493.652, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 109, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 487.815, "r_y0": 493.652, "r_x1": 496.599, "r_y1": 493.652, "r_x2": 496.599, "r_y2": 485.898, "r_x3": 487.815, "r_y3": 485.898, "coord_origin": "TOPLEFT"}, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 84, "label": "text", "bbox": {"l": 366.701, "t": 449.25, "r": 372.706, "b": 459.214, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 112, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 366.701, "r_y0": 459.214, "r_x1": 372.706, "r_y1": 459.214, "r_x2": 372.706, "r_y2": 449.25, "r_x3": 366.701, "r_y3": 449.25, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 87, "label": "text", "bbox": {"l": 331.904, "t": 473.452, "r": 337.909, "b": 483.416, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 115, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 331.904, "r_y0": 483.416, "r_x1": 337.909, "r_y1": 483.416, "r_x2": 337.909, "r_y2": 473.452, "r_x3": 331.904, "r_y3": 473.452, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 89, "label": "text", "bbox": {"l": 459.876, "t": 437.723, "r": 465.881, "b": 447.687, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 117, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 459.876, "r_y0": 447.687, "r_x1": 465.881, "r_y1": 447.687, "r_x2": 465.881, "r_y2": 437.723, "r_x3": 459.876, "r_y3": 437.723, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}]}, "text": null, "otsl_seq": ["fcel", "fcel", "lcel", "lcel", "lcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 5, "num_cols": 5, "table_cells": [{"bbox": {"l": 347.249, "t": 437.723, "r": 465.881, "b": 447.687, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 4, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 1, "end_col_offset_idx": 5, "text": "1 2 1", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 318.881, "t": 438.459, "r": 323.273, "b": 446.213, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "0", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 318.773, "t": 450.319, "r": 323.166, "b": 458.073, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "3", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 347.249, "t": 449.25, "r": 372.706, "b": 459.214, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "4 3", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 394.104, "t": 450.319, "r": 398.497, "b": 458.073, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "5", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 440.959, "t": 450.319, "r": 445.352, "b": 458.073, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "6", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 487.815, "t": 450.319, "r": 492.207, "b": 458.073, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "7", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 318.773, "t": 473.452, "r": 337.909, "b": 483.416, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "8 2", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 347.249, "t": 462.618, "r": 351.641, "b": 470.372, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "9", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 394.104, "t": 462.618, "r": 402.888, "b": 470.372, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "10", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 440.959, "t": 462.618, "r": 449.423, "b": 470.372, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "11", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 487.815, "t": 462.618, "r": 496.599, "b": 470.372, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "12", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 347.249, "t": 474.477, "r": 356.033, "b": 482.232, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "13", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 394.104, "t": 474.477, "r": 402.888, "b": 482.232, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "14", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 440.959, "t": 474.477, "r": 449.743, "b": 482.232, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "15", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 487.815, "t": 474.477, "r": 496.599, "b": 482.232, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "16", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 347.249, "t": 485.898, "r": 356.033, "b": 493.652, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "17", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 394.104, "t": 485.898, "r": 402.888, "b": 493.652, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "18", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 440.959, "t": 485.898, "r": 449.743, "b": 493.652, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "19", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 487.815, "t": 485.898, "r": 496.599, "b": 493.652, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "20", "column_header": false, "row_header": false, "row_section": false}]}, {"label": "picture", "id": 16, "page_no": 0, "cluster": {"id": 16, "label": "picture", "bbox": {"l": 315.65362548828125, "t": 228.723388671875, "r": 537.1475219726562, "b": 302.8014221191406, "coord_origin": "TOPLEFT"}, "confidence": 0.608779788017273, "cells": [{"index": 110, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 451.946, "r_y0": 245.44000000000005, "r_x1": 457.951, "r_y1": 245.44000000000005, "r_x2": 457.951, "r_y2": 235.47699999999998, "r_x3": 451.946, "r_y3": 235.47699999999998, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 113, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 331.197, "r_y0": 279.446, "r_x1": 337.202, "r_y1": 279.446, "r_x2": 337.202, "r_y2": 269.48199999999997, "r_x3": 331.197, "r_y3": 269.48199999999997, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 118, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 384.033, "r_y0": 262.77200000000005, "r_x1": 390.038, "r_y1": 262.77200000000005, "r_x2": 390.038, "r_y2": 252.80899999999997, "r_x3": 384.033, "r_y3": 252.80899999999997, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": [{"id": 82, "label": "text", "bbox": {"l": 451.946, "t": 235.47699999999998, "r": 457.951, "b": 245.44000000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 110, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 451.946, "r_y0": 245.44000000000005, "r_x1": 457.951, "r_y1": 245.44000000000005, "r_x2": 457.951, "r_y2": 235.47699999999998, "r_x3": 451.946, "r_y3": 235.47699999999998, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 85, "label": "text", "bbox": {"l": 331.197, "t": 269.48199999999997, "r": 337.202, "b": 279.446, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 113, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 331.197, "r_y0": 279.446, "r_x1": 337.202, "r_y1": 279.446, "r_x2": 337.202, "r_y2": 269.48199999999997, "r_x3": 331.197, "r_y3": 269.48199999999997, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 90, "label": "text", "bbox": {"l": 384.033, "t": 252.80899999999997, "r": 390.038, "b": 262.77200000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 118, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 384.033, "r_y0": 262.77200000000005, "r_x1": 390.038, "r_y1": 262.77200000000005, "r_x2": 390.038, "r_y2": 252.80899999999997, "r_x3": 384.033, "r_y3": 252.80899999999997, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}]}, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null}, {"label": "table", "id": 15, "page_no": 0, "cluster": {"id": 15, "label": "table", "bbox": {"l": 315.65362548828125, "t": 228.723388671875, "r": 537.1475219726562, "b": 302.8014221191406, "coord_origin": "TOPLEFT"}, "confidence": 0.6515864729881287, "cells": [{"index": 110, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 451.946, "r_y0": 245.44000000000005, "r_x1": 457.951, "r_y1": 245.44000000000005, "r_x2": 457.951, "r_y2": 235.47699999999998, "r_x3": 451.946, "r_y3": 235.47699999999998, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 113, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 331.197, "r_y0": 279.446, "r_x1": 337.202, "r_y1": 279.446, "r_x2": 337.202, "r_y2": 269.48199999999997, "r_x3": 331.197, "r_y3": 269.48199999999997, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 118, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 384.033, "r_y0": 262.77200000000005, "r_x1": 390.038, "r_y1": 262.77200000000005, "r_x2": 390.038, "r_y2": 252.80899999999997, "r_x3": 384.033, "r_y3": 252.80899999999997, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": [{"id": 82, "label": "text", "bbox": {"l": 451.946, "t": 235.47699999999998, "r": 457.951, "b": 245.44000000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 110, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 451.946, "r_y0": 245.44000000000005, "r_x1": 457.951, "r_y1": 245.44000000000005, "r_x2": 457.951, "r_y2": 235.47699999999998, "r_x3": 451.946, "r_y3": 235.47699999999998, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 85, "label": "text", "bbox": {"l": 331.197, "t": 269.48199999999997, "r": 337.202, "b": 279.446, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 113, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 331.197, "r_y0": 279.446, "r_x1": 337.202, "r_y1": 279.446, "r_x2": 337.202, "r_y2": 269.48199999999997, "r_x3": 331.197, "r_y3": 269.48199999999997, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 90, "label": "text", "bbox": {"l": 384.033, "t": 252.80899999999997, "r": 390.038, "b": 262.77200000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 118, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 384.033, "r_y0": 262.77200000000005, "r_x1": 390.038, "r_y1": 262.77200000000005, "r_x2": 390.038, "r_y2": 252.80899999999997, "r_x3": 384.033, "r_y3": 252.80899999999997, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}]}, "text": null, "otsl_seq": ["ecel", "ched", "ched", "ched", "ched", "nl", "rhed", "rhed", "fcel", "fcel", "fcel", "nl", "ucel", "rhed", "fcel", "fcel", "fcel", "nl", "ucel", "rhed", "fcel", "fcel", "fcel", "nl"], "num_rows": 1, "num_cols": 1, "table_cells": [{"bbox": {"l": 451.946, "t": 235.47699999999998, "r": 457.951, "b": 245.44000000000005, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "1", "column_header": true, "row_header": false, "row_section": false}]}, {"label": "caption", "id": 6, "page_no": 0, "cluster": {"id": 6, "label": "caption", "bbox": {"l": 308.862, "t": 514.769, "r": 545.115, "b": 559.187, "coord_origin": "TOPLEFT"}, "confidence": 0.9214619398117065, "cells": [{"index": 119, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 523.321, "r_x1": 345.734, "r_y1": 523.321, "r_x2": 345.734, "r_y2": 514.769, "r_x3": 308.862, "r_y3": 514.769, "coord_origin": "TOPLEFT"}, "text": "Figure 1:", "orig": "Figure 1:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 120, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 353.176, "r_y0": 523.321, "r_x1": 545.115, "r_y1": 523.321, "r_x2": 545.115, "r_y2": 514.769, "r_x3": 353.176, "r_y3": 514.769, "coord_origin": "TOPLEFT"}, "text": "Picture of a table with subtle, complex features", "orig": "Picture of a table with subtle, complex features", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 121, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 535.2760000000001, "r_x1": 545.115, "r_y1": 535.2760000000001, "r_x2": 545.115, "r_y2": 526.7239999999999, "r_x3": 308.862, "r_y3": 526.7239999999999, "coord_origin": "TOPLEFT"}, "text": "such as (1) multi-column headers, (2) cell with multi-row", "orig": "such as (1) multi-column headers, (2) cell with multi-row", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 122, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 547.231, "r_x1": 445.539, "r_y1": 547.231, "r_x2": 445.539, "r_y2": 538.679, "r_x3": 308.862, "r_y3": 538.679, "coord_origin": "TOPLEFT"}, "text": "text and (3) cells with no content.", "orig": "text and (3) cells with no content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 123, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 450.221, "r_y0": 547.231, "r_x1": 545.115, "r_y1": 547.231, "r_x2": 545.115, "r_y2": 538.679, "r_x3": 450.221, "r_y3": 538.679, "coord_origin": "TOPLEFT"}, "text": "Image from PubTabNet", "orig": "Image from PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 124, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 559.187, "r_x1": 505.692, "r_y1": 559.187, "r_x2": 505.692, "r_y2": 550.635, "r_x3": 308.862, "r_y3": 550.635, "coord_origin": "TOPLEFT"}, "text": "evaluation set, filename: 'PMC2944238 004 02'.", "orig": "evaluation set, filename: 'PMC2944238 004 02'.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Figure 1: Picture of a table with subtle, complex features such as (1) multi-column headers, (2) cell with multi-row text and (3) cells with no content. Image from PubTabNet evaluation set, filename: 'PMC2944238 004 02'."}, {"label": "text", "id": 0, "page_no": 0, "cluster": {"id": 0, "label": "text", "bbox": {"l": 308.862, "t": 584.678, "r": 545.115, "b": 664.961, "coord_origin": "TOPLEFT"}, "confidence": 0.9848759770393372, "cells": [{"index": 125, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 593.23, "r_x1": 358.077, "r_y1": 593.23, "r_x2": 358.077, "r_y2": 584.678, "r_x3": 320.817, "r_y3": 584.678, "coord_origin": "TOPLEFT"}, "text": "Recently,", "orig": "Recently,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 126, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 362.62, "r_y0": 593.23, "r_x1": 404.134, "r_y1": 593.23, "r_x2": 404.134, "r_y2": 584.678, "r_x3": 362.62, "r_y3": 584.678, "coord_origin": "TOPLEFT"}, "text": "significant", "orig": "significant", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 127, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 408.259, "r_y0": 593.23, "r_x1": 545.115, "r_y1": 593.23, "r_x2": 545.115, "r_y2": 584.678, "r_x3": 408.259, "r_y3": 584.678, "coord_origin": "TOPLEFT"}, "text": "progress has been made with vi-", "orig": "progress has been made with vi-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 128, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 605.185, "r_x1": 526.365, "r_y1": 605.185, "r_x2": 526.365, "r_y2": 596.633, "r_x3": 308.862, "r_y3": 596.633, "coord_origin": "TOPLEFT"}, "text": "sion based approaches to extract tables in documents.", "orig": "sion based approaches to extract tables in documents.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 129, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 531.426, "r_y0": 605.185, "r_x1": 545.115, "r_y1": 605.185, "r_x2": 545.115, "r_y2": 596.633, "r_x3": 531.426, "r_y3": 596.633, "coord_origin": "TOPLEFT"}, "text": "For", "orig": "For", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 130, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 617.14, "r_x1": 545.115, "r_y1": 617.14, "r_x2": 545.115, "r_y2": 608.588, "r_x3": 308.862, "r_y3": 608.588, "coord_origin": "TOPLEFT"}, "text": "the sake of completeness, the issue of table extraction from", "orig": "the sake of completeness, the issue of table extraction from", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 131, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 629.095, "r_x1": 545.115, "r_y1": 629.095, "r_x2": 545.115, "r_y2": 620.543, "r_x3": 308.862, "r_y3": 620.543, "coord_origin": "TOPLEFT"}, "text": "documents is typically decomposed into two separate chal-", "orig": "documents is typically decomposed into two separate chal-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 132, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 641.0509999999999, "r_x1": 336.807, "r_y1": 641.0509999999999, "r_x2": 336.807, "r_y2": 632.499, "r_x3": 308.862, "r_y3": 632.499, "coord_origin": "TOPLEFT"}, "text": "lenges,", "orig": "lenges,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 133, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 341.519, "r_y0": 641.0509999999999, "r_x1": 353.694, "r_y1": 641.0509999999999, "r_x2": 353.694, "r_y2": 632.499, "r_x3": 341.519, "r_y3": 632.499, "coord_origin": "TOPLEFT"}, "text": "i.e.", "orig": "i.e.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 134, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 362.112, "r_y0": 641.0509999999999, "r_x1": 373.728, "r_y1": 641.0509999999999, "r_x2": 373.728, "r_y2": 632.499, "r_x3": 362.112, "r_y3": 632.499, "coord_origin": "TOPLEFT"}, "text": "(1)", "orig": "(1)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 135, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 377.992, "r_y0": 641.0509999999999, "r_x1": 406.226, "r_y1": 641.0509999999999, "r_x2": 406.226, "r_y2": 632.499, "r_x3": 377.992, "r_y3": 632.499, "coord_origin": "TOPLEFT"}, "text": "finding", "orig": "finding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 136, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 410.5, "r_y0": 641.0509999999999, "r_x1": 422.675, "r_y1": 641.0509999999999, "r_x2": 422.675, "r_y2": 632.499, "r_x3": 410.5, "r_y3": 632.499, "coord_origin": "TOPLEFT"}, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 137, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 426.939, "r_y0": 641.0509999999999, "r_x1": 459.038, "r_y1": 641.0509999999999, "r_x2": 459.038, "r_y2": 632.499, "r_x3": 426.939, "r_y3": 632.499, "coord_origin": "TOPLEFT"}, "text": "location", "orig": "location", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 138, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 463.302, "r_y0": 641.0509999999999, "r_x1": 471.601, "r_y1": 641.0509999999999, "r_x2": 471.601, "r_y2": 632.499, "r_x3": 463.302, "r_y3": 632.499, "coord_origin": "TOPLEFT"}, "text": "of", "orig": "of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 139, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 475.875, "r_y0": 641.0509999999999, "r_x1": 488.049, "r_y1": 641.0509999999999, "r_x2": 488.049, "r_y2": 632.499, "r_x3": 475.875, "r_y3": 632.499, "coord_origin": "TOPLEFT"}, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 140, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 492.313, "r_y0": 641.0509999999999, "r_x1": 522.191, "r_y1": 641.0509999999999, "r_x2": 522.191, "r_y2": 632.499, "r_x3": 492.313, "r_y3": 632.499, "coord_origin": "TOPLEFT"}, "text": "table(s)", "orig": "table(s)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 141, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 526.455, "r_y0": 641.0509999999999, "r_x1": 545.115, "r_y1": 641.0509999999999, "r_x2": 545.115, "r_y2": 632.499, "r_x3": 526.455, "r_y3": 632.499, "coord_origin": "TOPLEFT"}, "text": "on a", "orig": "on a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 142, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 653.006, "r_x1": 545.115, "r_y1": 653.006, "r_x2": 545.115, "r_y2": 644.454, "r_x3": 308.862, "r_y3": 644.454, "coord_origin": "TOPLEFT"}, "text": "document-page and (2) finding the structure of a given table", "orig": "document-page and (2) finding the structure of a given table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 143, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 664.961, "r_x1": 375.552, "r_y1": 664.961, "r_x2": 375.552, "r_y2": 656.409, "r_x3": 308.862, "r_y3": 656.409, "coord_origin": "TOPLEFT"}, "text": "in the document.", "orig": "in the document.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Recently, significant progress has been made with vision based approaches to extract tables in documents. For the sake of completeness, the issue of table extraction from documents is typically decomposed into two separate challenges, i.e. (1) finding the location of the table(s) on a document-page and (2) finding the structure of a given table in the document."}, {"label": "text", "id": 3, "page_no": 0, "cluster": {"id": 3, "label": "text", "bbox": {"l": 308.862, "t": 668.649, "r": 545.115, "b": 713.066, "coord_origin": "TOPLEFT"}, "confidence": 0.979152262210846, "cells": [{"index": 144, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 677.201, "r_x1": 545.115, "r_y1": 677.201, "r_x2": 545.115, "r_y2": 668.649, "r_x3": 320.817, "r_y3": 668.649, "coord_origin": "TOPLEFT"}, "text": "The first problem is called table-location and has been", "orig": "The first problem is called table-location and has been", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 145, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 689.156, "r_x1": 545.115, "r_y1": 689.156, "r_x2": 545.115, "r_y2": 680.604, "r_x3": 308.862, "r_y3": 680.604, "coord_origin": "TOPLEFT"}, "text": "previously addressed [30, 38, 19, 21, 23, 26, 8] with state-", "orig": "previously addressed [30, 38, 19, 21, 23, 26, 8] with state-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 146, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 701.111, "r_x1": 474.261, "r_y1": 701.111, "r_x2": 474.261, "r_y2": 692.559, "r_x3": 308.862, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "of-the-art object-detection networks (e.g.", "orig": "of-the-art object-detection networks (e.g.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 147, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 479.342, "r_y0": 701.111, "r_x1": 545.115, "r_y1": 701.111, "r_x2": 545.115, "r_y2": 692.559, "r_x3": 479.342, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "YOLO and later", "orig": "YOLO and later", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 148, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 713.066, "r_x1": 395.796, "r_y1": 713.066, "r_x2": 395.796, "r_y2": 704.514, "r_x3": 308.862, "r_y3": 704.514, "coord_origin": "TOPLEFT"}, "text": "on Mask-RCNN [9]).", "orig": "on Mask-RCNN [9]).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 149, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 401.046, "r_y0": 713.066, "r_x1": 545.115, "r_y1": 713.066, "r_x2": 545.115, "r_y2": 704.514, "r_x3": 401.046, "r_y3": 704.514, "coord_origin": "TOPLEFT"}, "text": "For all practical purposes, it can be", "orig": "For all practical purposes, it can be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "The first problem is called table-location and has been previously addressed [30, 38, 19, 21, 23, 26, 8] with stateof-the-art object-detection networks (e.g. YOLO and later on Mask-RCNN [9]). For all practical purposes, it can be"}, {"label": "page_footer", "id": 12, "page_no": 0, "cluster": {"id": 12, "label": "page_footer", "bbox": {"l": 295.121, "t": 734.402, "r": 300.102, "b": 742.954, "coord_origin": "TOPLEFT"}, "confidence": 0.8045893311500549, "cells": [{"index": 150, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 295.121, "r_y0": 742.954, "r_x1": 300.102, "r_y1": 742.954, "r_x2": 300.102, "r_y2": 734.402, "r_x3": 295.121, "r_y3": 734.402, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "1"}, {"label": "page_header", "id": 9, "page_no": 0, "cluster": {"id": 9, "label": "page_header", "bbox": {"l": 18.34, "t": 210.0, "r": 36.34, "b": 560.0, "coord_origin": "TOPLEFT"}, "confidence": 0.8773143887519836, "cells": [{"index": 151, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 36.34, "r_y0": 560.0, "r_x1": 36.34, "r_y1": 380.0, "r_x2": 18.34, "r_y2": 380.0, "r_x3": 18.34, "r_y3": 560.0, "coord_origin": "TOPLEFT"}, "text": "arXiv:2203.01017v2", "orig": "arXiv:2203.01017v2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 152, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 36.34, "r_y0": 360.0, "r_x1": 36.34, "r_y1": 290.0, "r_x2": 18.34, "r_y2": 290.0, "r_x3": 18.34, "r_y3": 360.0, "coord_origin": "TOPLEFT"}, "text": "[cs.CV]", "orig": "[cs.CV]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 153, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 36.34, "r_y0": 270.0, "r_x1": 36.34, "r_y1": 250.0, "r_x2": 18.34, "r_y2": 250.0, "r_x3": 18.34, "r_y3": 270.0, "coord_origin": "TOPLEFT"}, "text": "11", "orig": "11", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 154, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 36.34, "r_y0": 240.0, "r_x1": 36.34, "r_y1": 210.0, "r_x2": 18.34, "r_y2": 210.0, "r_x3": 18.34, "r_y3": 240.0, "coord_origin": "TOPLEFT"}, "text": "Mar", "orig": "Mar", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "arXiv:2203.01017v2 [cs.CV] 11 Mar"}, {"label": "text", "id": 91, "page_no": 0, "cluster": {"id": 91, "label": "text", "bbox": {"l": 18.34, "t": 160.0, "r": 36.34, "b": 200.0, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 155, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 36.34, "r_y0": 200.0, "r_x1": 36.34, "r_y1": 160.0, "r_x2": 18.34, "r_y2": 160.0, "r_x3": 18.34, "r_y3": 200.0, "coord_origin": "TOPLEFT"}, "text": "2022", "orig": "2022", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "2022"}], "body": [{"label": "section_header", "id": 8, "page_no": 0, "cluster": {"id": 8, "label": "section_header", "bbox": {"l": 96.301, "t": 107.03399999999999, "r": 498.927, "b": 119.93100000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.8868067860603333, "cells": [{"index": 0, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 96.301, "r_y0": 119.93100000000004, "r_x1": 498.927, "r_y1": 119.93100000000004, "r_x2": 498.927, "r_y2": 107.03399999999999, "r_x3": 96.301, "r_y3": 107.03399999999999, "coord_origin": "TOPLEFT"}, "text": "TableFormer: Table Structure Understanding with Transformers.", "orig": "TableFormer: Table Structure Understanding with Transformers.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "TableFormer: Table Structure Understanding with Transformers."}, {"label": "section_header", "id": 13, "page_no": 0, "cluster": {"id": 13, "label": "section_header", "bbox": {"l": 142.477, "t": 147.00800000000004, "r": 452.75, "b": 171.21699999999998, "coord_origin": "TOPLEFT"}, "confidence": 0.7586215734481812, "cells": [{"index": 1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 142.477, "r_y0": 157.26999999999998, "r_x1": 452.75, "r_y1": 157.26999999999998, "r_x2": 452.75, "r_y2": 147.00800000000004, "r_x3": 142.477, "r_y3": 147.00800000000004, "coord_origin": "TOPLEFT"}, "text": "Ahmed Nassar, Nikolaos Livathinos, Maksym Lysak, Peter Staar", "orig": "Ahmed Nassar, Nikolaos Livathinos, Maksym Lysak, Peter Staar", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 262.918, "r_y0": 171.21699999999998, "r_x1": 332.306, "r_y1": 171.21699999999998, "r_x2": 332.306, "r_y2": 160.95500000000004, "r_x3": 262.918, "r_y3": 160.95500000000004, "coord_origin": "TOPLEFT"}, "text": "IBM Research", "orig": "IBM Research", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Ahmed Nassar, Nikolaos Livathinos, Maksym Lysak, Peter Staar IBM Research"}, {"label": "key_value_region", "id": 25, "page_no": 0, "cluster": {"id": 25, "label": "key_value_region", "bbox": {"l": 208.123, "t": 176.562, "r": 378.733, "b": 184.26999999999998, "coord_origin": "TOPLEFT"}, "confidence": 0.4854728579521179, "cells": [{"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 208.123, "r_y0": 184.26999999999998, "r_x1": 212.731, "r_y1": 184.26999999999998, "r_x2": 212.731, "r_y2": 176.562, "r_x3": 208.123, "r_y3": 176.562, "coord_origin": "TOPLEFT"}, "text": "{", "orig": "{", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 212.73, "r_y0": 183.861, "r_x1": 378.733, "r_y1": 183.861, "r_x2": 378.733, "r_y2": 177.692, "r_x3": 212.73, "r_y3": 177.692, "coord_origin": "TOPLEFT"}, "text": "ahn,nli,mly,taa @zurich.ibm.com", "orig": "ahn,nli,mly,taa @zurich.ibm.com", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 293.428, "r_y0": 184.26999999999998, "r_x1": 298.036, "r_y1": 184.26999999999998, "r_x2": 298.036, "r_y2": 176.562, "r_x3": 293.428, "r_y3": 176.562, "coord_origin": "TOPLEFT"}, "text": "}", "orig": "}", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": [{"id": 7, "label": "text", "bbox": {"l": 208.123, "t": 176.562, "r": 378.733, "b": 184.26999999999998, "coord_origin": "TOPLEFT"}, "confidence": 0.9096331596374512, "cells": [{"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 208.123, "r_y0": 184.26999999999998, "r_x1": 212.731, "r_y1": 184.26999999999998, "r_x2": 212.731, "r_y2": 176.562, "r_x3": 208.123, "r_y3": 176.562, "coord_origin": "TOPLEFT"}, "text": "{", "orig": "{", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 212.73, "r_y0": 183.861, "r_x1": 378.733, "r_y1": 183.861, "r_x2": 378.733, "r_y2": 177.692, "r_x3": 212.73, "r_y3": 177.692, "coord_origin": "TOPLEFT"}, "text": "ahn,nli,mly,taa @zurich.ibm.com", "orig": "ahn,nli,mly,taa @zurich.ibm.com", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 293.428, "r_y0": 184.26999999999998, "r_x1": 298.036, "r_y1": 184.26999999999998, "r_x2": 298.036, "r_y2": 176.562, "r_x3": 293.428, "r_y3": 176.562, "coord_origin": "TOPLEFT"}, "text": "}", "orig": "}", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}]}, "text": null}, {"label": "section_header", "id": 5, "page_no": 0, "cluster": {"id": 5, "label": "section_header", "bbox": {"l": 145.995, "t": 215.48299999999995, "r": 190.48, "b": 226.231, "coord_origin": "TOPLEFT"}, "confidence": 0.9258671402931213, "cells": [{"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 145.995, "r_y0": 226.231, "r_x1": 190.48, "r_y1": 226.231, "r_x2": 190.48, "r_y2": 215.48299999999995, "r_x3": 145.995, "r_y3": 215.48299999999995, "coord_origin": "TOPLEFT"}, "text": "Abstract", "orig": "Abstract", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Abstract"}, {"label": "text", "id": 2, "page_no": 0, "cluster": {"id": 2, "label": "text", "bbox": {"l": 50.112, "t": 241.39499999999998, "r": 286.365, "b": 512.9970000000001, "coord_origin": "TOPLEFT"}, "confidence": 0.9838882088661194, "cells": [{"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 249.98299999999995, "r_x1": 286.365, "r_y1": 249.98299999999995, "r_x2": 286.365, "r_y2": 241.39499999999998, "r_x3": 62.067, "r_y3": 241.39499999999998, "coord_origin": "TOPLEFT"}, "text": "Tables organize valuable content in a concise and com-", "orig": "Tables organize valuable content in a concise and com-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 261.938, "r_x1": 130.062, "r_y1": 261.938, "r_x2": 130.062, "r_y2": 253.35000000000002, "r_x3": 50.112, "r_y3": 253.35000000000002, "coord_origin": "TOPLEFT"}, "text": "pact representation.", "orig": "pact representation.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.475, "r_y0": 261.938, "r_x1": 286.365, "r_y1": 261.938, "r_x2": 286.365, "r_y2": 253.35000000000002, "r_x3": 134.475, "r_y3": 253.35000000000002, "coord_origin": "TOPLEFT"}, "text": "This content is extremely valuable for", "orig": "This content is extremely valuable for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 273.89300000000003, "r_x1": 286.365, "r_y1": 273.89300000000003, "r_x2": 286.365, "r_y2": 265.30499999999995, "r_x3": 50.112, "r_y3": 265.30499999999995, "coord_origin": "TOPLEFT"}, "text": "systems such as search engines, Knowledge Graph's, etc,", "orig": "systems such as search engines, Knowledge Graph's, etc,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 285.849, "r_x1": 245.18, "r_y1": 285.849, "r_x2": 245.18, "r_y2": 277.26099999999997, "r_x3": 50.112, "r_y3": 277.26099999999997, "coord_origin": "TOPLEFT"}, "text": "since they enhance their predictive capabilities.", "orig": "since they enhance their predictive capabilities.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 251.496, "r_y0": 285.849, "r_x1": 286.365, "r_y1": 285.849, "r_x2": 286.365, "r_y2": 277.26099999999997, "r_x3": 251.496, "r_y3": 277.26099999999997, "coord_origin": "TOPLEFT"}, "text": "Unfortu-", "orig": "Unfortu-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 297.804, "r_x1": 286.365, "r_y1": 297.804, "r_x2": 286.365, "r_y2": 289.216, "r_x3": 50.112, "r_y3": 289.216, "coord_origin": "TOPLEFT"}, "text": "nately, tables come in a large variety of shapes and sizes.", "orig": "nately, tables come in a large variety of shapes and sizes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 309.759, "r_x1": 103.601, "r_y1": 309.759, "r_x2": 103.601, "r_y2": 301.171, "r_x3": 50.112, "r_y3": 301.171, "coord_origin": "TOPLEFT"}, "text": "Furthermore,", "orig": "Furthermore,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 108.393, "r_y0": 309.759, "r_x1": 124.692, "r_y1": 309.759, "r_x2": 124.692, "r_y2": 301.171, "r_x3": 108.393, "r_y3": 301.171, "coord_origin": "TOPLEFT"}, "text": "they", "orig": "they", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 129.026, "r_y0": 309.759, "r_x1": 286.365, "r_y1": 309.759, "r_x2": 286.365, "r_y2": 301.171, "r_x3": 129.026, "r_y3": 301.171, "coord_origin": "TOPLEFT"}, "text": "can have complex column/row-header", "orig": "can have complex column/row-header", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 321.714, "r_x1": 286.365, "r_y1": 321.714, "r_x2": 286.365, "r_y2": 313.126, "r_x3": 50.112, "r_y3": 313.126, "coord_origin": "TOPLEFT"}, "text": "configurations, multiline rows, different variety of separa-", "orig": "configurations, multiline rows, different variety of separa-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 333.669, "r_x1": 175.123, "r_y1": 333.669, "r_x2": 175.123, "r_y2": 325.081, "r_x3": 50.112, "r_y3": 325.081, "coord_origin": "TOPLEFT"}, "text": "tion lines, missing entries, etc.", "orig": "tion lines, missing entries, etc.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 19, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 180.931, "r_y0": 333.669, "r_x1": 286.365, "r_y1": 333.669, "r_x2": 286.365, "r_y2": 325.081, "r_x3": 180.931, "r_y3": 325.081, "coord_origin": "TOPLEFT"}, "text": "As such, the correct iden-", "orig": "As such, the correct iden-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 20, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 345.624, "r_x1": 85.539, "r_y1": 345.624, "r_x2": 85.539, "r_y2": 337.036, "r_x3": 50.112, "r_y3": 337.036, "coord_origin": "TOPLEFT"}, "text": "tification", "orig": "tification", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 21, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 89.942, "r_y0": 345.624, "r_x1": 97.693, "r_y1": 345.624, "r_x2": 97.693, "r_y2": 337.036, "r_x3": 89.942, "r_y3": 337.036, "coord_origin": "TOPLEFT"}, "text": "of", "orig": "of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 22, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 102.107, "r_y0": 345.624, "r_x1": 114.281, "r_y1": 345.624, "r_x2": 114.281, "r_y2": 337.036, "r_x3": 102.107, "r_y3": 337.036, "coord_origin": "TOPLEFT"}, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 23, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 118.695, "r_y0": 345.624, "r_x1": 177.534, "r_y1": 345.624, "r_x2": 177.534, "r_y2": 337.036, "r_x3": 118.695, "r_y3": 337.036, "coord_origin": "TOPLEFT"}, "text": "table-structure", "orig": "table-structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 24, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 181.947, "r_y0": 345.624, "r_x1": 286.365, "r_y1": 345.624, "r_x2": 286.365, "r_y2": 337.036, "r_x3": 181.947, "r_y3": 337.036, "coord_origin": "TOPLEFT"}, "text": "from an image is a non-", "orig": "from an image is a non-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 25, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 357.58, "r_x1": 95.791, "r_y1": 357.58, "r_x2": 95.791, "r_y2": 348.992, "r_x3": 50.112, "r_y3": 348.992, "coord_origin": "TOPLEFT"}, "text": "trivial task.", "orig": "trivial task.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 26, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 99.746, "r_y0": 357.58, "r_x1": 286.365, "r_y1": 357.58, "r_x2": 286.365, "r_y2": 348.992, "r_x3": 99.746, "r_y3": 348.992, "coord_origin": "TOPLEFT"}, "text": "In this paper, we present a new table-structure", "orig": "In this paper, we present a new table-structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 27, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 369.535, "r_x1": 132.443, "r_y1": 369.535, "r_x2": 132.443, "r_y2": 360.947, "r_x3": 50.112, "r_y3": 360.947, "coord_origin": "TOPLEFT"}, "text": "identification model.", "orig": "identification model.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 28, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 136.777, "r_y0": 369.535, "r_x1": 286.365, "r_y1": 369.535, "r_x2": 286.365, "r_y2": 360.947, "r_x3": 136.777, "r_y3": 360.947, "coord_origin": "TOPLEFT"}, "text": "The latter improves the latest end-to-", "orig": "The latter improves the latest end-to-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 29, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 381.49, "r_x1": 170.4, "r_y1": 381.49, "r_x2": 170.4, "r_y2": 372.902, "r_x3": 50.112, "r_y3": 372.902, "coord_origin": "TOPLEFT"}, "text": "end deep learning model (i.e.", "orig": "end deep learning model (i.e.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 30, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 176.248, "r_y0": 381.49, "r_x1": 286.365, "r_y1": 381.49, "r_x2": 286.365, "r_y2": 372.902, "r_x3": 176.248, "r_y3": 372.902, "coord_origin": "TOPLEFT"}, "text": "encoder-dual-decoder from", "orig": "encoder-dual-decoder from", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 393.445, "r_x1": 196.572, "r_y1": 393.445, "r_x2": 196.572, "r_y2": 384.857, "r_x3": 50.112, "r_y3": 384.857, "coord_origin": "TOPLEFT"}, "text": "PubTabNet) in two significant ways.", "orig": "PubTabNet) in two significant ways.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 201.643, "r_y0": 393.445, "r_x1": 286.365, "r_y1": 393.445, "r_x2": 286.365, "r_y2": 384.857, "r_x3": 201.643, "r_y3": 384.857, "coord_origin": "TOPLEFT"}, "text": "First, we introduce a", "orig": "First, we introduce a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 405.4, "r_x1": 232.328, "r_y1": 405.4, "r_x2": 232.328, "r_y2": 396.812, "r_x3": 50.112, "r_y3": 396.812, "coord_origin": "TOPLEFT"}, "text": "new object detection decoder for table-cells.", "orig": "new object detection decoder for table-cells.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 238.584, "r_y0": 405.4, "r_x1": 286.365, "r_y1": 405.4, "r_x2": 286.365, "r_y2": 396.812, "r_x3": 238.584, "r_y3": 396.812, "coord_origin": "TOPLEFT"}, "text": "In this way,", "orig": "In this way,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 417.355, "r_x1": 286.365, "r_y1": 417.355, "r_x2": 286.365, "r_y2": 408.767, "r_x3": 50.112, "r_y3": 408.767, "coord_origin": "TOPLEFT"}, "text": "we can obtain the content of the table-cells from program-", "orig": "we can obtain the content of the table-cells from program-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 429.311, "r_x1": 286.365, "r_y1": 429.311, "r_x2": 286.365, "r_y2": 420.723, "r_x3": 50.112, "r_y3": 420.723, "coord_origin": "TOPLEFT"}, "text": "matic PDF's directly from the PDF source and avoid the", "orig": "matic PDF's directly from the PDF source and avoid the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 441.266, "r_x1": 207.232, "r_y1": 441.266, "r_x2": 207.232, "r_y2": 432.678, "r_x3": 50.112, "r_y3": 432.678, "coord_origin": "TOPLEFT"}, "text": "training of the custom OCR decoders.", "orig": "training of the custom OCR decoders.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 214.096, "r_y0": 441.266, "r_x1": 286.365, "r_y1": 441.266, "r_x2": 286.365, "r_y2": 432.678, "r_x3": 214.096, "r_y3": 432.678, "coord_origin": "TOPLEFT"}, "text": "This architectural", "orig": "This architectural", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 453.221, "r_x1": 286.365, "r_y1": 453.221, "r_x2": 286.365, "r_y2": 444.633, "r_x3": 50.112, "r_y3": 444.633, "coord_origin": "TOPLEFT"}, "text": "change leads to more accurate table-content extraction and", "orig": "change leads to more accurate table-content extraction and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 465.176, "r_x1": 204.233, "r_y1": 465.176, "r_x2": 204.233, "r_y2": 456.588, "r_x3": 50.112, "r_y3": 456.588, "coord_origin": "TOPLEFT"}, "text": "allows us to tackle non-english tables.", "orig": "allows us to tackle non-english tables.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 208.587, "r_y0": 465.176, "r_x1": 286.365, "r_y1": 465.176, "r_x2": 286.365, "r_y2": 456.588, "r_x3": 208.587, "r_y3": 456.588, "coord_origin": "TOPLEFT"}, "text": "Second, we replace", "orig": "Second, we replace", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 477.131, "r_x1": 286.365, "r_y1": 477.131, "r_x2": 286.365, "r_y2": 468.543, "r_x3": 50.112, "r_y3": 468.543, "coord_origin": "TOPLEFT"}, "text": "the LSTM decoders with transformer based decoders. This", "orig": "the LSTM decoders with transformer based decoders. This", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 489.087, "r_x1": 286.365, "r_y1": 489.087, "r_x2": 286.365, "r_y2": 480.499, "r_x3": 50.112, "r_y3": 480.499, "coord_origin": "TOPLEFT"}, "text": "upgrade improves significantly the previous state-of-the-art", "orig": "upgrade improves significantly the previous state-of-the-art", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 501.042, "r_x1": 286.365, "r_y1": 501.042, "r_x2": 286.365, "r_y2": 492.454, "r_x3": 50.112, "r_y3": 492.454, "coord_origin": "TOPLEFT"}, "text": "tree-editing-distance-score (TEDS) from 91% to 98.5% on", "orig": "tree-editing-distance-score (TEDS) from 91% to 98.5% on", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 512.9970000000001, "r_x1": 276.652, "r_y1": 512.9970000000001, "r_x2": 276.652, "r_y2": 504.409, "r_x3": 50.112, "r_y3": 504.409, "coord_origin": "TOPLEFT"}, "text": "simple tables and from 88.7% to 95% on complex tables.", "orig": "simple tables and from 88.7% to 95% on complex tables.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Tables organize valuable content in a concise and compact representation. This content is extremely valuable for systems such as search engines, Knowledge Graph's, etc, since they enhance their predictive capabilities. Unfortunately, tables come in a large variety of shapes and sizes. Furthermore, they can have complex column/row-header configurations, multiline rows, different variety of separation lines, missing entries, etc. As such, the correct identification of the table-structure from an image is a nontrivial task. In this paper, we present a new table-structure identification model. The latter improves the latest end-toend deep learning model (i.e. encoder-dual-decoder from PubTabNet) in two significant ways. First, we introduce a new object detection decoder for table-cells. In this way, we can obtain the content of the table-cells from programmatic PDF's directly from the PDF source and avoid the training of the custom OCR decoders. This architectural change leads to more accurate table-content extraction and allows us to tackle non-english tables. Second, we replace the LSTM decoders with transformer based decoders. This upgrade improves significantly the previous state-of-the-art tree-editing-distance-score (TEDS) from 91% to 98.5% on simple tables and from 88.7% to 95% on complex tables."}, {"label": "section_header", "id": 4, "page_no": 0, "cluster": {"id": 4, "label": "section_header", "bbox": {"l": 50.112, "t": 539.943, "r": 126.948, "b": 550.691, "coord_origin": "TOPLEFT"}, "confidence": 0.9317677617073059, "cells": [{"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 550.691, "r_x1": 126.948, "r_y1": 550.691, "r_x2": 126.948, "r_y2": 539.943, "r_x3": 50.112, "r_y3": 539.943, "coord_origin": "TOPLEFT"}, "text": "1. Introduction", "orig": "1. Introduction", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "1. Introduction"}, {"label": "text", "id": 1, "page_no": 0, "cluster": {"id": 1, "label": "text", "bbox": {"l": 50.112, "t": 561.052, "r": 286.365, "b": 713.066, "coord_origin": "TOPLEFT"}, "confidence": 0.9841895699501038, "cells": [{"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 569.604, "r_x1": 166.266, "r_y1": 569.604, "r_x2": 166.266, "r_y2": 561.052, "r_x3": 62.067, "r_y3": 561.052, "coord_origin": "TOPLEFT"}, "text": "The occurrence of tables", "orig": "The occurrence of tables", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 48, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 170.759, "r_y0": 569.604, "r_x1": 178.51, "r_y1": 569.604, "r_x2": 178.51, "r_y2": 561.052, "r_x3": 170.759, "r_y3": 561.052, "coord_origin": "TOPLEFT"}, "text": "in", "orig": "in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 49, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.003, "r_y0": 569.604, "r_x1": 286.365, "r_y1": 569.604, "r_x2": 286.365, "r_y2": 561.052, "r_x3": 183.003, "r_y3": 561.052, "coord_origin": "TOPLEFT"}, "text": "documents is ubiquitous.", "orig": "documents is ubiquitous.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 50, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 581.559, "r_x1": 286.365, "r_y1": 581.559, "r_x2": 286.365, "r_y2": 573.0070000000001, "r_x3": 50.112, "r_y3": 573.0070000000001, "coord_origin": "TOPLEFT"}, "text": "They often summarise quantitative or factual data, which is", "orig": "They often summarise quantitative or factual data, which is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 51, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 593.514, "r_x1": 286.365, "r_y1": 593.514, "r_x2": 286.365, "r_y2": 584.962, "r_x3": 50.112, "r_y3": 584.962, "coord_origin": "TOPLEFT"}, "text": "cumbersome to describe in verbose text but nevertheless ex-", "orig": "cumbersome to describe in verbose text but nevertheless ex-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 52, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 605.47, "r_x1": 119.95, "r_y1": 605.47, "r_x2": 119.95, "r_y2": 596.918, "r_x3": 50.112, "r_y3": 596.918, "coord_origin": "TOPLEFT"}, "text": "tremely valuable.", "orig": "tremely valuable.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 53, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 125.778, "r_y0": 605.47, "r_x1": 286.365, "r_y1": 605.47, "r_x2": 286.365, "r_y2": 596.918, "r_x3": 125.778, "r_y3": 596.918, "coord_origin": "TOPLEFT"}, "text": "Unfortunately, this compact representa-", "orig": "Unfortunately, this compact representa-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 54, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 617.425, "r_x1": 286.365, "r_y1": 617.425, "r_x2": 286.365, "r_y2": 608.873, "r_x3": 50.112, "r_y3": 608.873, "coord_origin": "TOPLEFT"}, "text": "tion is often not easy to parse by machines. There are many", "orig": "tion is often not easy to parse by machines. There are many", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 55, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 629.38, "r_x1": 286.365, "r_y1": 629.38, "r_x2": 286.365, "r_y2": 620.828, "r_x3": 50.112, "r_y3": 620.828, "coord_origin": "TOPLEFT"}, "text": "implicit conventions used to obtain a compact table repre-", "orig": "implicit conventions used to obtain a compact table repre-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 56, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 641.335, "r_x1": 286.365, "r_y1": 641.335, "r_x2": 286.365, "r_y2": 632.783, "r_x3": 50.112, "r_y3": 632.783, "coord_origin": "TOPLEFT"}, "text": "sentation. For example, tables often have complex column-", "orig": "sentation. For example, tables often have complex column-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 57, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 653.29, "r_x1": 286.365, "r_y1": 653.29, "r_x2": 286.365, "r_y2": 644.738, "r_x3": 50.112, "r_y3": 644.738, "coord_origin": "TOPLEFT"}, "text": "and row-headers in order to reduce duplicated cell content.", "orig": "and row-headers in order to reduce duplicated cell content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 58, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 665.245, "r_x1": 286.365, "r_y1": 665.245, "r_x2": 286.365, "r_y2": 656.693, "r_x3": 50.112, "r_y3": 656.693, "coord_origin": "TOPLEFT"}, "text": "Lines of different shapes and sizes are leveraged to separate", "orig": "Lines of different shapes and sizes are leveraged to separate", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 59, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 677.201, "r_x1": 286.365, "r_y1": 677.201, "r_x2": 286.365, "r_y2": 668.649, "r_x3": 50.112, "r_y3": 668.649, "coord_origin": "TOPLEFT"}, "text": "content or indicate a tree structure. Additionally, tables can", "orig": "content or indicate a tree structure. Additionally, tables can", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 60, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 689.156, "r_x1": 286.365, "r_y1": 689.156, "r_x2": 286.365, "r_y2": 680.604, "r_x3": 50.112, "r_y3": 680.604, "coord_origin": "TOPLEFT"}, "text": "also have empty/missing table-entries or multi-row textual", "orig": "also have empty/missing table-entries or multi-row textual", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 61, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 701.111, "r_x1": 101.848, "r_y1": 701.111, "r_x2": 101.848, "r_y2": 692.559, "r_x3": 50.112, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "table-entries.", "orig": "table-entries.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 62, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 106.261, "r_y0": 701.111, "r_x1": 286.365, "r_y1": 701.111, "r_x2": 286.365, "r_y2": 692.559, "r_x3": 106.261, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "Fig. 1 shows a table which presents all these", "orig": "Fig. 1 shows a table which presents all these", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 63, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 713.066, "r_x1": 76.403, "r_y1": 713.066, "r_x2": 76.403, "r_y2": 704.514, "r_x3": 50.112, "r_y3": 704.514, "coord_origin": "TOPLEFT"}, "text": "issues.", "orig": "issues.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "The occurrence of tables in documents is ubiquitous. They often summarise quantitative or factual data, which is cumbersome to describe in verbose text but nevertheless extremely valuable. Unfortunately, this compact representation is often not easy to parse by machines. There are many implicit conventions used to obtain a compact table representation. For example, tables often have complex columnand row-headers in order to reduce duplicated cell content. Lines of different shapes and sizes are leveraged to separate content or indicate a tree structure. Additionally, tables can also have empty/missing table-entries or multi-row textual table-entries. Fig. 1 shows a table which presents all these issues."}, {"label": "section_header", "id": 14, "page_no": 0, "cluster": {"id": 14, "label": "section_header", "bbox": {"l": 315.567, "t": 218.34900000000005, "r": 408.441, "b": 226.66200000000003, "coord_origin": "TOPLEFT"}, "confidence": 0.6724023818969727, "cells": [{"index": 64, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 315.567, "r_y0": 226.66200000000003, "r_x1": 408.441, "r_y1": 226.66200000000003, "r_x2": 408.441, "r_y2": 218.34900000000005, "r_x3": 315.567, "r_y3": 218.34900000000005, "coord_origin": "TOPLEFT"}, "text": "a. Picture of a table:", "orig": "a. Picture of a table:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "a. Picture of a table:"}, {"label": "list_item", "id": 17, "page_no": 0, "cluster": {"id": 17, "label": "list_item", "bbox": {"l": 315.567, "t": 314.037, "r": 486.402, "b": 333.15, "coord_origin": "TOPLEFT"}, "confidence": 0.5549328923225403, "cells": [{"index": 65, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 315.567, "r_y0": 322.35, "r_x1": 486.402, "r_y1": 322.35, "r_x2": 486.402, "r_y2": 314.037, "r_x3": 315.567, "r_y3": 314.037, "coord_origin": "TOPLEFT"}, "text": "b. Red-annotation of bounding boxes,", "orig": "b. Red-annotation of bounding boxes,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 66, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 326.463, "r_y0": 333.15, "r_x1": 472.474, "r_y1": 333.15, "r_x2": 472.474, "r_y2": 324.837, "r_x3": 326.463, "r_y3": 324.837, "coord_origin": "TOPLEFT"}, "text": "Blue-predictions by TableFormer", "orig": "Blue-predictions by TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "b. Red-annotation of bounding boxes, Blue-predictions by TableFormer"}, {"label": "list_item", "id": 18, "page_no": 0, "cluster": {"id": 18, "label": "list_item", "bbox": {"l": 315.567, "t": 420.525, "r": 491.191, "b": 428.838, "coord_origin": "TOPLEFT"}, "confidence": 0.5501358509063721, "cells": [{"index": 67, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 315.567, "r_y0": 428.838, "r_x1": 491.191, "r_y1": 428.838, "r_x2": 491.191, "r_y2": 420.525, "r_x3": 315.567, "r_y3": 420.525, "coord_origin": "TOPLEFT"}, "text": "c. Structure predicted by TableFormer:", "orig": "c. Structure predicted by TableFormer:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "c. Structure predicted by TableFormer:"}, {"label": "picture", "id": 10, "page_no": 0, "cluster": {"id": 10, "label": "picture", "bbox": {"l": 314.78173828125, "t": 338.0652770996094, "r": 539.1802978515625, "b": 410.0494384765625, "coord_origin": "TOPLEFT"}, "confidence": 0.8742761611938477, "cells": [{"index": 68, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 408.148, "r_y0": 351.356, "r_x1": 412.54, "r_y1": 351.356, "r_x2": 412.54, "r_y2": 343.601, "r_x3": 408.148, "r_y3": 343.601, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 69, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 356.11, "r_y0": 350.099, "r_x1": 360.503, "r_y1": 350.099, "r_x2": 360.503, "r_y2": 342.345, "r_x3": 356.11, "r_y3": 342.345, "coord_origin": "TOPLEFT"}, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 70, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 500.678, "r_y0": 349.465, "r_x1": 505.07, "r_y1": 349.465, "r_x2": 505.07, "r_y2": 341.711, "r_x3": 500.678, "r_y3": 341.711, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 71, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 356.134, "r_y0": 360.275, "r_x1": 360.526, "r_y1": 360.275, "r_x2": 360.526, "r_y2": 352.521, "r_x3": 356.134, "r_y3": 352.521, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 72, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 402.54, "r_y0": 364.404, "r_x1": 406.932, "r_y1": 364.404, "r_x2": 406.932, "r_y2": 356.65, "r_x3": 402.54, "r_y3": 356.65, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 73, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 448.582, "r_y0": 361.367, "r_x1": 452.974, "r_y1": 361.367, "r_x2": 452.974, "r_y2": 353.613, "r_x3": 448.582, "r_y3": 353.613, "coord_origin": "TOPLEFT"}, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 74, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 491.652, "r_y0": 362.234, "r_x1": 496.044, "r_y1": 362.234, "r_x2": 496.044, "r_y2": 354.48, "r_x3": 491.652, "r_y3": 354.48, "coord_origin": "TOPLEFT"}, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 75, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 535.138, "r_y0": 361.867, "r_x1": 539.531, "r_y1": 361.867, "r_x2": 539.531, "r_y2": 354.113, "r_x3": 535.138, "r_y3": 354.113, "coord_origin": "TOPLEFT"}, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 76, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 348.828, "r_y0": 395.625, "r_x1": 353.221, "r_y1": 395.625, "r_x2": 353.221, "r_y2": 387.871, "r_x3": 348.828, "r_y3": 387.871, "coord_origin": "TOPLEFT"}, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 77, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 389.272, "r_y0": 383.9, "r_x1": 393.664, "r_y1": 383.9, "r_x2": 393.664, "r_y2": 376.145, "r_x3": 389.272, "r_y3": 376.145, "coord_origin": "TOPLEFT"}, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 78, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 442.675, "r_y0": 384.173, "r_x1": 451.459, "r_y1": 384.173, "r_x2": 451.459, "r_y2": 376.419, "r_x3": 442.675, "r_y3": 376.419, "coord_origin": "TOPLEFT"}, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 79, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 477.438, "r_y0": 384.061, "r_x1": 485.902, "r_y1": 384.061, "r_x2": 485.902, "r_y2": 376.307, "r_x3": 477.438, "r_y3": 376.307, "coord_origin": "TOPLEFT"}, "text": "11", "orig": "11", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 80, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 522.573, "r_y0": 384.173, "r_x1": 531.357, "r_y1": 384.173, "r_x2": 531.357, "r_y2": 376.419, "r_x3": 522.573, "r_y3": 376.419, "coord_origin": "TOPLEFT"}, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 81, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 400.23, "r_y0": 395.642, "r_x1": 409.014, "r_y1": 395.642, "r_x2": 409.014, "r_y2": 387.887, "r_x3": 400.23, "r_y3": 387.887, "coord_origin": "TOPLEFT"}, "text": "13", "orig": "13", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 82, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 442.308, "r_y0": 395.517, "r_x1": 451.092, "r_y1": 395.517, "r_x2": 451.092, "r_y2": 387.763, "r_x3": 442.308, "r_y3": 387.763, "coord_origin": "TOPLEFT"}, "text": "14", "orig": "14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 83, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 478.219, "r_y0": 395.902, "r_x1": 487.003, "r_y1": 395.902, "r_x2": 487.003, "r_y2": 388.148, "r_x3": 478.219, "r_y3": 388.148, "coord_origin": "TOPLEFT"}, "text": "15", "orig": "15", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 84, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 523.229, "r_y0": 395.517, "r_x1": 532.013, "r_y1": 395.517, "r_x2": 532.013, "r_y2": 387.763, "r_x3": 523.229, "r_y3": 387.763, "coord_origin": "TOPLEFT"}, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 85, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 411.572, "r_y0": 407.952, "r_x1": 420.356, "r_y1": 407.952, "r_x2": 420.356, "r_y2": 400.198, "r_x3": 411.572, "r_y3": 400.198, "coord_origin": "TOPLEFT"}, "text": "17", "orig": "17", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 86, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 442.305, "r_y0": 407.564, "r_x1": 451.089, "r_y1": 407.564, "r_x2": 451.089, "r_y2": 399.81, "r_x3": 442.305, "r_y3": 399.81, "coord_origin": "TOPLEFT"}, "text": "18", "orig": "18", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 87, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 478.779, "r_y0": 407.524, "r_x1": 487.563, "r_y1": 407.524, "r_x2": 487.563, "r_y2": 399.769, "r_x3": 478.779, "r_y3": 399.769, "coord_origin": "TOPLEFT"}, "text": "19", "orig": "19", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 88, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 523.972, "r_y0": 407.139, "r_x1": 532.756, "r_y1": 407.139, "r_x2": 532.756, "r_y2": 399.385, "r_x3": 523.972, "r_y3": 399.385, "coord_origin": "TOPLEFT"}, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 111, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 385.094, "r_y0": 367.853, "r_x1": 391.099, "r_y1": 367.853, "r_x2": 391.099, "r_y2": 357.89, "r_x3": 385.094, "r_y3": 357.89, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 114, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 333.435, "r_y0": 390.82, "r_x1": 339.439, "r_y1": 390.82, "r_x2": 339.439, "r_y2": 380.856, "r_x3": 333.435, "r_y3": 380.856, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 116, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 478.072, "r_y0": 351.13, "r_x1": 484.077, "r_y1": 351.13, "r_x2": 484.077, "r_y2": 341.166, "r_x3": 478.072, "r_y3": 341.166, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": [{"id": 40, "label": "text", "bbox": {"l": 408.148, "t": 343.601, "r": 412.54, "b": 351.356, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 68, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 408.148, "r_y0": 351.356, "r_x1": 412.54, "r_y1": 351.356, "r_x2": 412.54, "r_y2": 343.601, "r_x3": 408.148, "r_y3": 343.601, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 41, "label": "text", "bbox": {"l": 356.11, "t": 342.345, "r": 360.503, "b": 350.099, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 69, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 356.11, "r_y0": 350.099, "r_x1": 360.503, "r_y1": 350.099, "r_x2": 360.503, "r_y2": 342.345, "r_x3": 356.11, "r_y3": 342.345, "coord_origin": "TOPLEFT"}, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 42, "label": "text", "bbox": {"l": 500.678, "t": 341.711, "r": 505.07, "b": 349.465, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 70, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 500.678, "r_y0": 349.465, "r_x1": 505.07, "r_y1": 349.465, "r_x2": 505.07, "r_y2": 341.711, "r_x3": 500.678, "r_y3": 341.711, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 43, "label": "text", "bbox": {"l": 356.134, "t": 352.521, "r": 360.526, "b": 360.275, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 71, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 356.134, "r_y0": 360.275, "r_x1": 360.526, "r_y1": 360.275, "r_x2": 360.526, "r_y2": 352.521, "r_x3": 356.134, "r_y3": 352.521, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 44, "label": "text", "bbox": {"l": 402.54, "t": 356.65, "r": 406.932, "b": 364.404, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 72, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 402.54, "r_y0": 364.404, "r_x1": 406.932, "r_y1": 364.404, "r_x2": 406.932, "r_y2": 356.65, "r_x3": 402.54, "r_y3": 356.65, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 45, "label": "text", "bbox": {"l": 448.582, "t": 353.613, "r": 452.974, "b": 361.367, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 73, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 448.582, "r_y0": 361.367, "r_x1": 452.974, "r_y1": 361.367, "r_x2": 452.974, "r_y2": 353.613, "r_x3": 448.582, "r_y3": 353.613, "coord_origin": "TOPLEFT"}, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 46, "label": "text", "bbox": {"l": 491.652, "t": 354.48, "r": 496.044, "b": 362.234, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 74, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 491.652, "r_y0": 362.234, "r_x1": 496.044, "r_y1": 362.234, "r_x2": 496.044, "r_y2": 354.48, "r_x3": 491.652, "r_y3": 354.48, "coord_origin": "TOPLEFT"}, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 47, "label": "text", "bbox": {"l": 535.138, "t": 354.113, "r": 539.531, "b": 361.867, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 75, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 535.138, "r_y0": 361.867, "r_x1": 539.531, "r_y1": 361.867, "r_x2": 539.531, "r_y2": 354.113, "r_x3": 535.138, "r_y3": 354.113, "coord_origin": "TOPLEFT"}, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 48, "label": "text", "bbox": {"l": 348.828, "t": 387.871, "r": 353.221, "b": 395.625, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 76, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 348.828, "r_y0": 395.625, "r_x1": 353.221, "r_y1": 395.625, "r_x2": 353.221, "r_y2": 387.871, "r_x3": 348.828, "r_y3": 387.871, "coord_origin": "TOPLEFT"}, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 49, "label": "text", "bbox": {"l": 389.272, "t": 376.145, "r": 393.664, "b": 383.9, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 77, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 389.272, "r_y0": 383.9, "r_x1": 393.664, "r_y1": 383.9, "r_x2": 393.664, "r_y2": 376.145, "r_x3": 389.272, "r_y3": 376.145, "coord_origin": "TOPLEFT"}, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 50, "label": "text", "bbox": {"l": 442.675, "t": 376.419, "r": 451.459, "b": 384.173, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 78, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 442.675, "r_y0": 384.173, "r_x1": 451.459, "r_y1": 384.173, "r_x2": 451.459, "r_y2": 376.419, "r_x3": 442.675, "r_y3": 376.419, "coord_origin": "TOPLEFT"}, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 51, "label": "text", "bbox": {"l": 477.438, "t": 376.307, "r": 485.902, "b": 384.061, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 79, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 477.438, "r_y0": 384.061, "r_x1": 485.902, "r_y1": 384.061, "r_x2": 485.902, "r_y2": 376.307, "r_x3": 477.438, "r_y3": 376.307, "coord_origin": "TOPLEFT"}, "text": "11", "orig": "11", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 52, "label": "text", "bbox": {"l": 522.573, "t": 376.419, "r": 531.357, "b": 384.173, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 80, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 522.573, "r_y0": 384.173, "r_x1": 531.357, "r_y1": 384.173, "r_x2": 531.357, "r_y2": 376.419, "r_x3": 522.573, "r_y3": 376.419, "coord_origin": "TOPLEFT"}, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 53, "label": "text", "bbox": {"l": 400.23, "t": 387.887, "r": 409.014, "b": 395.642, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 81, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 400.23, "r_y0": 395.642, "r_x1": 409.014, "r_y1": 395.642, "r_x2": 409.014, "r_y2": 387.887, "r_x3": 400.23, "r_y3": 387.887, "coord_origin": "TOPLEFT"}, "text": "13", "orig": "13", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 54, "label": "text", "bbox": {"l": 442.308, "t": 387.763, "r": 451.092, "b": 395.517, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 82, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 442.308, "r_y0": 395.517, "r_x1": 451.092, "r_y1": 395.517, "r_x2": 451.092, "r_y2": 387.763, "r_x3": 442.308, "r_y3": 387.763, "coord_origin": "TOPLEFT"}, "text": "14", "orig": "14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 55, "label": "text", "bbox": {"l": 478.219, "t": 388.148, "r": 487.003, "b": 395.902, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 83, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 478.219, "r_y0": 395.902, "r_x1": 487.003, "r_y1": 395.902, "r_x2": 487.003, "r_y2": 388.148, "r_x3": 478.219, "r_y3": 388.148, "coord_origin": "TOPLEFT"}, "text": "15", "orig": "15", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 56, "label": "text", "bbox": {"l": 523.229, "t": 387.763, "r": 532.013, "b": 395.517, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 84, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 523.229, "r_y0": 395.517, "r_x1": 532.013, "r_y1": 395.517, "r_x2": 532.013, "r_y2": 387.763, "r_x3": 523.229, "r_y3": 387.763, "coord_origin": "TOPLEFT"}, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 57, "label": "text", "bbox": {"l": 411.572, "t": 400.198, "r": 420.356, "b": 407.952, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 85, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 411.572, "r_y0": 407.952, "r_x1": 420.356, "r_y1": 407.952, "r_x2": 420.356, "r_y2": 400.198, "r_x3": 411.572, "r_y3": 400.198, "coord_origin": "TOPLEFT"}, "text": "17", "orig": "17", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 58, "label": "text", "bbox": {"l": 442.305, "t": 399.81, "r": 451.089, "b": 407.564, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 86, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 442.305, "r_y0": 407.564, "r_x1": 451.089, "r_y1": 407.564, "r_x2": 451.089, "r_y2": 399.81, "r_x3": 442.305, "r_y3": 399.81, "coord_origin": "TOPLEFT"}, "text": "18", "orig": "18", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 59, "label": "text", "bbox": {"l": 478.779, "t": 399.769, "r": 487.563, "b": 407.524, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 87, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 478.779, "r_y0": 407.524, "r_x1": 487.563, "r_y1": 407.524, "r_x2": 487.563, "r_y2": 399.769, "r_x3": 478.779, "r_y3": 399.769, "coord_origin": "TOPLEFT"}, "text": "19", "orig": "19", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 60, "label": "text", "bbox": {"l": 523.972, "t": 399.385, "r": 532.756, "b": 407.139, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 88, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 523.972, "r_y0": 407.139, "r_x1": 532.756, "r_y1": 407.139, "r_x2": 532.756, "r_y2": 399.385, "r_x3": 523.972, "r_y3": 399.385, "coord_origin": "TOPLEFT"}, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 83, "label": "text", "bbox": {"l": 385.094, "t": 357.89, "r": 391.099, "b": 367.853, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 111, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 385.094, "r_y0": 367.853, "r_x1": 391.099, "r_y1": 367.853, "r_x2": 391.099, "r_y2": 357.89, "r_x3": 385.094, "r_y3": 357.89, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 86, "label": "text", "bbox": {"l": 333.435, "t": 380.856, "r": 339.439, "b": 390.82, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 114, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 333.435, "r_y0": 390.82, "r_x1": 339.439, "r_y1": 390.82, "r_x2": 339.439, "r_y2": 380.856, "r_x3": 333.435, "r_y3": 380.856, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 88, "label": "text", "bbox": {"l": 478.072, "t": 341.166, "r": 484.077, "b": 351.13, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 116, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 478.072, "r_y0": 351.13, "r_x1": 484.077, "r_y1": 351.13, "r_x2": 484.077, "r_y2": 341.166, "r_x3": 478.072, "r_y3": 341.166, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}]}, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null}, {"label": "picture", "id": 23, "page_no": 0, "cluster": {"id": 23, "label": "picture", "bbox": {"l": 315.7172546386719, "t": 433.823486328125, "r": 536.835693359375, "b": 496.0290222167969, "coord_origin": "TOPLEFT"}, "confidence": 0.5088632702827454, "cells": [{"index": 89, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 347.249, "r_y0": 446.213, "r_x1": 351.641, "r_y1": 446.213, "r_x2": 351.641, "r_y2": 438.459, "r_x3": 347.249, "r_y3": 438.459, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 90, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 318.881, "r_y0": 446.213, "r_x1": 323.273, "r_y1": 446.213, "r_x2": 323.273, "r_y2": 438.459, "r_x3": 318.881, "r_y3": 438.459, "coord_origin": "TOPLEFT"}, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 91, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.104, "r_y0": 446.213, "r_x1": 398.497, "r_y1": 446.213, "r_x2": 398.497, "r_y2": 438.459, "r_x3": 394.104, "r_y3": 438.459, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 92, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 318.773, "r_y0": 458.073, "r_x1": 323.166, "r_y1": 458.073, "r_x2": 323.166, "r_y2": 450.319, "r_x3": 318.773, "r_y3": 450.319, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 93, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 347.249, "r_y0": 458.073, "r_x1": 351.641, "r_y1": 458.073, "r_x2": 351.641, "r_y2": 450.319, "r_x3": 347.249, "r_y3": 450.319, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 94, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.104, "r_y0": 458.073, "r_x1": 398.497, "r_y1": 458.073, "r_x2": 398.497, "r_y2": 450.319, "r_x3": 394.104, "r_y3": 450.319, "coord_origin": "TOPLEFT"}, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 95, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 440.959, "r_y0": 458.073, "r_x1": 445.352, "r_y1": 458.073, "r_x2": 445.352, "r_y2": 450.319, "r_x3": 440.959, "r_y3": 450.319, "coord_origin": "TOPLEFT"}, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 96, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 487.815, "r_y0": 458.073, "r_x1": 492.207, "r_y1": 458.073, "r_x2": 492.207, "r_y2": 450.319, "r_x3": 487.815, "r_y3": 450.319, "coord_origin": "TOPLEFT"}, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 97, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 318.773, "r_y0": 482.232, "r_x1": 323.166, "r_y1": 482.232, "r_x2": 323.166, "r_y2": 474.477, "r_x3": 318.773, "r_y3": 474.477, "coord_origin": "TOPLEFT"}, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 98, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 347.249, "r_y0": 470.372, "r_x1": 351.641, "r_y1": 470.372, "r_x2": 351.641, "r_y2": 462.618, "r_x3": 347.249, "r_y3": 462.618, "coord_origin": "TOPLEFT"}, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 99, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.104, "r_y0": 470.372, "r_x1": 402.888, "r_y1": 470.372, "r_x2": 402.888, "r_y2": 462.618, "r_x3": 394.104, "r_y3": 462.618, "coord_origin": "TOPLEFT"}, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 100, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 440.959, "r_y0": 470.372, "r_x1": 449.423, "r_y1": 470.372, "r_x2": 449.423, "r_y2": 462.618, "r_x3": 440.959, "r_y3": 462.618, "coord_origin": "TOPLEFT"}, "text": "11", "orig": "11", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 101, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 487.815, "r_y0": 470.372, "r_x1": 496.599, "r_y1": 470.372, "r_x2": 496.599, "r_y2": 462.618, "r_x3": 487.815, "r_y3": 462.618, "coord_origin": "TOPLEFT"}, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 102, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 347.249, "r_y0": 482.232, "r_x1": 356.033, "r_y1": 482.232, "r_x2": 356.033, "r_y2": 474.477, "r_x3": 347.249, "r_y3": 474.477, "coord_origin": "TOPLEFT"}, "text": "13", "orig": "13", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 103, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.104, "r_y0": 482.232, "r_x1": 402.888, "r_y1": 482.232, "r_x2": 402.888, "r_y2": 474.477, "r_x3": 394.104, "r_y3": 474.477, "coord_origin": "TOPLEFT"}, "text": "14", "orig": "14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 104, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 440.959, "r_y0": 482.232, "r_x1": 449.743, "r_y1": 482.232, "r_x2": 449.743, "r_y2": 474.477, "r_x3": 440.959, "r_y3": 474.477, "coord_origin": "TOPLEFT"}, "text": "15", "orig": "15", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 105, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 487.815, "r_y0": 482.232, "r_x1": 496.599, "r_y1": 482.232, "r_x2": 496.599, "r_y2": 474.477, "r_x3": 487.815, "r_y3": 474.477, "coord_origin": "TOPLEFT"}, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 106, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 347.249, "r_y0": 493.652, "r_x1": 356.033, "r_y1": 493.652, "r_x2": 356.033, "r_y2": 485.898, "r_x3": 347.249, "r_y3": 485.898, "coord_origin": "TOPLEFT"}, "text": "17", "orig": "17", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 107, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.104, "r_y0": 493.652, "r_x1": 402.888, "r_y1": 493.652, "r_x2": 402.888, "r_y2": 485.898, "r_x3": 394.104, "r_y3": 485.898, "coord_origin": "TOPLEFT"}, "text": "18", "orig": "18", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 108, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 440.959, "r_y0": 493.652, "r_x1": 449.743, "r_y1": 493.652, "r_x2": 449.743, "r_y2": 485.898, "r_x3": 440.959, "r_y3": 485.898, "coord_origin": "TOPLEFT"}, "text": "19", "orig": "19", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 109, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 487.815, "r_y0": 493.652, "r_x1": 496.599, "r_y1": 493.652, "r_x2": 496.599, "r_y2": 485.898, "r_x3": 487.815, "r_y3": 485.898, "coord_origin": "TOPLEFT"}, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 112, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 366.701, "r_y0": 459.214, "r_x1": 372.706, "r_y1": 459.214, "r_x2": 372.706, "r_y2": 449.25, "r_x3": 366.701, "r_y3": 449.25, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 115, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 331.904, "r_y0": 483.416, "r_x1": 337.909, "r_y1": 483.416, "r_x2": 337.909, "r_y2": 473.452, "r_x3": 331.904, "r_y3": 473.452, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 117, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 459.876, "r_y0": 447.687, "r_x1": 465.881, "r_y1": 447.687, "r_x2": 465.881, "r_y2": 437.723, "r_x3": 459.876, "r_y3": 437.723, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": [{"id": 61, "label": "text", "bbox": {"l": 347.249, "t": 438.459, "r": 351.641, "b": 446.213, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 89, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 347.249, "r_y0": 446.213, "r_x1": 351.641, "r_y1": 446.213, "r_x2": 351.641, "r_y2": 438.459, "r_x3": 347.249, "r_y3": 438.459, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 62, "label": "text", "bbox": {"l": 318.881, "t": 438.459, "r": 323.273, "b": 446.213, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 90, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 318.881, "r_y0": 446.213, "r_x1": 323.273, "r_y1": 446.213, "r_x2": 323.273, "r_y2": 438.459, "r_x3": 318.881, "r_y3": 438.459, "coord_origin": "TOPLEFT"}, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 63, "label": "text", "bbox": {"l": 394.104, "t": 438.459, "r": 398.497, "b": 446.213, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 91, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.104, "r_y0": 446.213, "r_x1": 398.497, "r_y1": 446.213, "r_x2": 398.497, "r_y2": 438.459, "r_x3": 394.104, "r_y3": 438.459, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 64, "label": "text", "bbox": {"l": 318.773, "t": 450.319, "r": 323.166, "b": 458.073, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 92, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 318.773, "r_y0": 458.073, "r_x1": 323.166, "r_y1": 458.073, "r_x2": 323.166, "r_y2": 450.319, "r_x3": 318.773, "r_y3": 450.319, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 65, "label": "text", "bbox": {"l": 347.249, "t": 450.319, "r": 351.641, "b": 458.073, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 93, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 347.249, "r_y0": 458.073, "r_x1": 351.641, "r_y1": 458.073, "r_x2": 351.641, "r_y2": 450.319, "r_x3": 347.249, "r_y3": 450.319, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 66, "label": "text", "bbox": {"l": 394.104, "t": 450.319, "r": 398.497, "b": 458.073, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 94, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.104, "r_y0": 458.073, "r_x1": 398.497, "r_y1": 458.073, "r_x2": 398.497, "r_y2": 450.319, "r_x3": 394.104, "r_y3": 450.319, "coord_origin": "TOPLEFT"}, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 67, "label": "text", "bbox": {"l": 440.959, "t": 450.319, "r": 445.352, "b": 458.073, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 95, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 440.959, "r_y0": 458.073, "r_x1": 445.352, "r_y1": 458.073, "r_x2": 445.352, "r_y2": 450.319, "r_x3": 440.959, "r_y3": 450.319, "coord_origin": "TOPLEFT"}, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 68, "label": "text", "bbox": {"l": 487.815, "t": 450.319, "r": 492.207, "b": 458.073, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 96, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 487.815, "r_y0": 458.073, "r_x1": 492.207, "r_y1": 458.073, "r_x2": 492.207, "r_y2": 450.319, "r_x3": 487.815, "r_y3": 450.319, "coord_origin": "TOPLEFT"}, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 69, "label": "text", "bbox": {"l": 318.773, "t": 474.477, "r": 323.166, "b": 482.232, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 97, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 318.773, "r_y0": 482.232, "r_x1": 323.166, "r_y1": 482.232, "r_x2": 323.166, "r_y2": 474.477, "r_x3": 318.773, "r_y3": 474.477, "coord_origin": "TOPLEFT"}, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 70, "label": "text", "bbox": {"l": 347.249, "t": 462.618, "r": 351.641, "b": 470.372, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 98, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 347.249, "r_y0": 470.372, "r_x1": 351.641, "r_y1": 470.372, "r_x2": 351.641, "r_y2": 462.618, "r_x3": 347.249, "r_y3": 462.618, "coord_origin": "TOPLEFT"}, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 71, "label": "text", "bbox": {"l": 394.104, "t": 462.618, "r": 402.888, "b": 470.372, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 99, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.104, "r_y0": 470.372, "r_x1": 402.888, "r_y1": 470.372, "r_x2": 402.888, "r_y2": 462.618, "r_x3": 394.104, "r_y3": 462.618, "coord_origin": "TOPLEFT"}, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 72, "label": "text", "bbox": {"l": 440.959, "t": 462.618, "r": 449.423, "b": 470.372, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 100, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 440.959, "r_y0": 470.372, "r_x1": 449.423, "r_y1": 470.372, "r_x2": 449.423, "r_y2": 462.618, "r_x3": 440.959, "r_y3": 462.618, "coord_origin": "TOPLEFT"}, "text": "11", "orig": "11", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 73, "label": "text", "bbox": {"l": 487.815, "t": 462.618, "r": 496.599, "b": 470.372, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 101, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 487.815, "r_y0": 470.372, "r_x1": 496.599, "r_y1": 470.372, "r_x2": 496.599, "r_y2": 462.618, "r_x3": 487.815, "r_y3": 462.618, "coord_origin": "TOPLEFT"}, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 74, "label": "text", "bbox": {"l": 347.249, "t": 474.477, "r": 356.033, "b": 482.232, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 102, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 347.249, "r_y0": 482.232, "r_x1": 356.033, "r_y1": 482.232, "r_x2": 356.033, "r_y2": 474.477, "r_x3": 347.249, "r_y3": 474.477, "coord_origin": "TOPLEFT"}, "text": "13", "orig": "13", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 75, "label": "text", "bbox": {"l": 394.104, "t": 474.477, "r": 402.888, "b": 482.232, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 103, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.104, "r_y0": 482.232, "r_x1": 402.888, "r_y1": 482.232, "r_x2": 402.888, "r_y2": 474.477, "r_x3": 394.104, "r_y3": 474.477, "coord_origin": "TOPLEFT"}, "text": "14", "orig": "14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 76, "label": "text", "bbox": {"l": 440.959, "t": 474.477, "r": 449.743, "b": 482.232, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 104, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 440.959, "r_y0": 482.232, "r_x1": 449.743, "r_y1": 482.232, "r_x2": 449.743, "r_y2": 474.477, "r_x3": 440.959, "r_y3": 474.477, "coord_origin": "TOPLEFT"}, "text": "15", "orig": "15", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 77, "label": "text", "bbox": {"l": 487.815, "t": 474.477, "r": 496.599, "b": 482.232, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 105, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 487.815, "r_y0": 482.232, "r_x1": 496.599, "r_y1": 482.232, "r_x2": 496.599, "r_y2": 474.477, "r_x3": 487.815, "r_y3": 474.477, "coord_origin": "TOPLEFT"}, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 78, "label": "text", "bbox": {"l": 347.249, "t": 485.898, "r": 356.033, "b": 493.652, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 106, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 347.249, "r_y0": 493.652, "r_x1": 356.033, "r_y1": 493.652, "r_x2": 356.033, "r_y2": 485.898, "r_x3": 347.249, "r_y3": 485.898, "coord_origin": "TOPLEFT"}, "text": "17", "orig": "17", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 79, "label": "text", "bbox": {"l": 394.104, "t": 485.898, "r": 402.888, "b": 493.652, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 107, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.104, "r_y0": 493.652, "r_x1": 402.888, "r_y1": 493.652, "r_x2": 402.888, "r_y2": 485.898, "r_x3": 394.104, "r_y3": 485.898, "coord_origin": "TOPLEFT"}, "text": "18", "orig": "18", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 80, "label": "text", "bbox": {"l": 440.959, "t": 485.898, "r": 449.743, "b": 493.652, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 108, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 440.959, "r_y0": 493.652, "r_x1": 449.743, "r_y1": 493.652, "r_x2": 449.743, "r_y2": 485.898, "r_x3": 440.959, "r_y3": 485.898, "coord_origin": "TOPLEFT"}, "text": "19", "orig": "19", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 81, "label": "text", "bbox": {"l": 487.815, "t": 485.898, "r": 496.599, "b": 493.652, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 109, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 487.815, "r_y0": 493.652, "r_x1": 496.599, "r_y1": 493.652, "r_x2": 496.599, "r_y2": 485.898, "r_x3": 487.815, "r_y3": 485.898, "coord_origin": "TOPLEFT"}, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 84, "label": "text", "bbox": {"l": 366.701, "t": 449.25, "r": 372.706, "b": 459.214, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 112, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 366.701, "r_y0": 459.214, "r_x1": 372.706, "r_y1": 459.214, "r_x2": 372.706, "r_y2": 449.25, "r_x3": 366.701, "r_y3": 449.25, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 87, "label": "text", "bbox": {"l": 331.904, "t": 473.452, "r": 337.909, "b": 483.416, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 115, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 331.904, "r_y0": 483.416, "r_x1": 337.909, "r_y1": 483.416, "r_x2": 337.909, "r_y2": 473.452, "r_x3": 331.904, "r_y3": 473.452, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 89, "label": "text", "bbox": {"l": 459.876, "t": 437.723, "r": 465.881, "b": 447.687, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 117, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 459.876, "r_y0": 447.687, "r_x1": 465.881, "r_y1": 447.687, "r_x2": 465.881, "r_y2": 437.723, "r_x3": 459.876, "r_y3": 437.723, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}]}, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null}, {"label": "table", "id": 11, "page_no": 0, "cluster": {"id": 11, "label": "table", "bbox": {"l": 315.7172546386719, "t": 433.823486328125, "r": 536.835693359375, "b": 496.0290222167969, "coord_origin": "TOPLEFT"}, "confidence": 0.8056110739707947, "cells": [{"index": 89, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 347.249, "r_y0": 446.213, "r_x1": 351.641, "r_y1": 446.213, "r_x2": 351.641, "r_y2": 438.459, "r_x3": 347.249, "r_y3": 438.459, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 90, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 318.881, "r_y0": 446.213, "r_x1": 323.273, "r_y1": 446.213, "r_x2": 323.273, "r_y2": 438.459, "r_x3": 318.881, "r_y3": 438.459, "coord_origin": "TOPLEFT"}, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 91, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.104, "r_y0": 446.213, "r_x1": 398.497, "r_y1": 446.213, "r_x2": 398.497, "r_y2": 438.459, "r_x3": 394.104, "r_y3": 438.459, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 92, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 318.773, "r_y0": 458.073, "r_x1": 323.166, "r_y1": 458.073, "r_x2": 323.166, "r_y2": 450.319, "r_x3": 318.773, "r_y3": 450.319, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 93, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 347.249, "r_y0": 458.073, "r_x1": 351.641, "r_y1": 458.073, "r_x2": 351.641, "r_y2": 450.319, "r_x3": 347.249, "r_y3": 450.319, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 94, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.104, "r_y0": 458.073, "r_x1": 398.497, "r_y1": 458.073, "r_x2": 398.497, "r_y2": 450.319, "r_x3": 394.104, "r_y3": 450.319, "coord_origin": "TOPLEFT"}, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 95, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 440.959, "r_y0": 458.073, "r_x1": 445.352, "r_y1": 458.073, "r_x2": 445.352, "r_y2": 450.319, "r_x3": 440.959, "r_y3": 450.319, "coord_origin": "TOPLEFT"}, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 96, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 487.815, "r_y0": 458.073, "r_x1": 492.207, "r_y1": 458.073, "r_x2": 492.207, "r_y2": 450.319, "r_x3": 487.815, "r_y3": 450.319, "coord_origin": "TOPLEFT"}, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 97, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 318.773, "r_y0": 482.232, "r_x1": 323.166, "r_y1": 482.232, "r_x2": 323.166, "r_y2": 474.477, "r_x3": 318.773, "r_y3": 474.477, "coord_origin": "TOPLEFT"}, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 98, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 347.249, "r_y0": 470.372, "r_x1": 351.641, "r_y1": 470.372, "r_x2": 351.641, "r_y2": 462.618, "r_x3": 347.249, "r_y3": 462.618, "coord_origin": "TOPLEFT"}, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 99, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.104, "r_y0": 470.372, "r_x1": 402.888, "r_y1": 470.372, "r_x2": 402.888, "r_y2": 462.618, "r_x3": 394.104, "r_y3": 462.618, "coord_origin": "TOPLEFT"}, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 100, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 440.959, "r_y0": 470.372, "r_x1": 449.423, "r_y1": 470.372, "r_x2": 449.423, "r_y2": 462.618, "r_x3": 440.959, "r_y3": 462.618, "coord_origin": "TOPLEFT"}, "text": "11", "orig": "11", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 101, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 487.815, "r_y0": 470.372, "r_x1": 496.599, "r_y1": 470.372, "r_x2": 496.599, "r_y2": 462.618, "r_x3": 487.815, "r_y3": 462.618, "coord_origin": "TOPLEFT"}, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 102, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 347.249, "r_y0": 482.232, "r_x1": 356.033, "r_y1": 482.232, "r_x2": 356.033, "r_y2": 474.477, "r_x3": 347.249, "r_y3": 474.477, "coord_origin": "TOPLEFT"}, "text": "13", "orig": "13", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 103, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.104, "r_y0": 482.232, "r_x1": 402.888, "r_y1": 482.232, "r_x2": 402.888, "r_y2": 474.477, "r_x3": 394.104, "r_y3": 474.477, "coord_origin": "TOPLEFT"}, "text": "14", "orig": "14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 104, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 440.959, "r_y0": 482.232, "r_x1": 449.743, "r_y1": 482.232, "r_x2": 449.743, "r_y2": 474.477, "r_x3": 440.959, "r_y3": 474.477, "coord_origin": "TOPLEFT"}, "text": "15", "orig": "15", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 105, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 487.815, "r_y0": 482.232, "r_x1": 496.599, "r_y1": 482.232, "r_x2": 496.599, "r_y2": 474.477, "r_x3": 487.815, "r_y3": 474.477, "coord_origin": "TOPLEFT"}, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 106, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 347.249, "r_y0": 493.652, "r_x1": 356.033, "r_y1": 493.652, "r_x2": 356.033, "r_y2": 485.898, "r_x3": 347.249, "r_y3": 485.898, "coord_origin": "TOPLEFT"}, "text": "17", "orig": "17", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 107, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.104, "r_y0": 493.652, "r_x1": 402.888, "r_y1": 493.652, "r_x2": 402.888, "r_y2": 485.898, "r_x3": 394.104, "r_y3": 485.898, "coord_origin": "TOPLEFT"}, "text": "18", "orig": "18", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 108, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 440.959, "r_y0": 493.652, "r_x1": 449.743, "r_y1": 493.652, "r_x2": 449.743, "r_y2": 485.898, "r_x3": 440.959, "r_y3": 485.898, "coord_origin": "TOPLEFT"}, "text": "19", "orig": "19", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 109, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 487.815, "r_y0": 493.652, "r_x1": 496.599, "r_y1": 493.652, "r_x2": 496.599, "r_y2": 485.898, "r_x3": 487.815, "r_y3": 485.898, "coord_origin": "TOPLEFT"}, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 112, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 366.701, "r_y0": 459.214, "r_x1": 372.706, "r_y1": 459.214, "r_x2": 372.706, "r_y2": 449.25, "r_x3": 366.701, "r_y3": 449.25, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 115, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 331.904, "r_y0": 483.416, "r_x1": 337.909, "r_y1": 483.416, "r_x2": 337.909, "r_y2": 473.452, "r_x3": 331.904, "r_y3": 473.452, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 117, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 459.876, "r_y0": 447.687, "r_x1": 465.881, "r_y1": 447.687, "r_x2": 465.881, "r_y2": 437.723, "r_x3": 459.876, "r_y3": 437.723, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": [{"id": 61, "label": "text", "bbox": {"l": 347.249, "t": 438.459, "r": 351.641, "b": 446.213, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 89, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 347.249, "r_y0": 446.213, "r_x1": 351.641, "r_y1": 446.213, "r_x2": 351.641, "r_y2": 438.459, "r_x3": 347.249, "r_y3": 438.459, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 62, "label": "text", "bbox": {"l": 318.881, "t": 438.459, "r": 323.273, "b": 446.213, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 90, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 318.881, "r_y0": 446.213, "r_x1": 323.273, "r_y1": 446.213, "r_x2": 323.273, "r_y2": 438.459, "r_x3": 318.881, "r_y3": 438.459, "coord_origin": "TOPLEFT"}, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 63, "label": "text", "bbox": {"l": 394.104, "t": 438.459, "r": 398.497, "b": 446.213, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 91, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.104, "r_y0": 446.213, "r_x1": 398.497, "r_y1": 446.213, "r_x2": 398.497, "r_y2": 438.459, "r_x3": 394.104, "r_y3": 438.459, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 64, "label": "text", "bbox": {"l": 318.773, "t": 450.319, "r": 323.166, "b": 458.073, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 92, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 318.773, "r_y0": 458.073, "r_x1": 323.166, "r_y1": 458.073, "r_x2": 323.166, "r_y2": 450.319, "r_x3": 318.773, "r_y3": 450.319, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 65, "label": "text", "bbox": {"l": 347.249, "t": 450.319, "r": 351.641, "b": 458.073, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 93, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 347.249, "r_y0": 458.073, "r_x1": 351.641, "r_y1": 458.073, "r_x2": 351.641, "r_y2": 450.319, "r_x3": 347.249, "r_y3": 450.319, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 66, "label": "text", "bbox": {"l": 394.104, "t": 450.319, "r": 398.497, "b": 458.073, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 94, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.104, "r_y0": 458.073, "r_x1": 398.497, "r_y1": 458.073, "r_x2": 398.497, "r_y2": 450.319, "r_x3": 394.104, "r_y3": 450.319, "coord_origin": "TOPLEFT"}, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 67, "label": "text", "bbox": {"l": 440.959, "t": 450.319, "r": 445.352, "b": 458.073, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 95, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 440.959, "r_y0": 458.073, "r_x1": 445.352, "r_y1": 458.073, "r_x2": 445.352, "r_y2": 450.319, "r_x3": 440.959, "r_y3": 450.319, "coord_origin": "TOPLEFT"}, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 68, "label": "text", "bbox": {"l": 487.815, "t": 450.319, "r": 492.207, "b": 458.073, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 96, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 487.815, "r_y0": 458.073, "r_x1": 492.207, "r_y1": 458.073, "r_x2": 492.207, "r_y2": 450.319, "r_x3": 487.815, "r_y3": 450.319, "coord_origin": "TOPLEFT"}, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 69, "label": "text", "bbox": {"l": 318.773, "t": 474.477, "r": 323.166, "b": 482.232, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 97, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 318.773, "r_y0": 482.232, "r_x1": 323.166, "r_y1": 482.232, "r_x2": 323.166, "r_y2": 474.477, "r_x3": 318.773, "r_y3": 474.477, "coord_origin": "TOPLEFT"}, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 70, "label": "text", "bbox": {"l": 347.249, "t": 462.618, "r": 351.641, "b": 470.372, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 98, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 347.249, "r_y0": 470.372, "r_x1": 351.641, "r_y1": 470.372, "r_x2": 351.641, "r_y2": 462.618, "r_x3": 347.249, "r_y3": 462.618, "coord_origin": "TOPLEFT"}, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 71, "label": "text", "bbox": {"l": 394.104, "t": 462.618, "r": 402.888, "b": 470.372, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 99, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.104, "r_y0": 470.372, "r_x1": 402.888, "r_y1": 470.372, "r_x2": 402.888, "r_y2": 462.618, "r_x3": 394.104, "r_y3": 462.618, "coord_origin": "TOPLEFT"}, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 72, "label": "text", "bbox": {"l": 440.959, "t": 462.618, "r": 449.423, "b": 470.372, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 100, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 440.959, "r_y0": 470.372, "r_x1": 449.423, "r_y1": 470.372, "r_x2": 449.423, "r_y2": 462.618, "r_x3": 440.959, "r_y3": 462.618, "coord_origin": "TOPLEFT"}, "text": "11", "orig": "11", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 73, "label": "text", "bbox": {"l": 487.815, "t": 462.618, "r": 496.599, "b": 470.372, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 101, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 487.815, "r_y0": 470.372, "r_x1": 496.599, "r_y1": 470.372, "r_x2": 496.599, "r_y2": 462.618, "r_x3": 487.815, "r_y3": 462.618, "coord_origin": "TOPLEFT"}, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 74, "label": "text", "bbox": {"l": 347.249, "t": 474.477, "r": 356.033, "b": 482.232, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 102, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 347.249, "r_y0": 482.232, "r_x1": 356.033, "r_y1": 482.232, "r_x2": 356.033, "r_y2": 474.477, "r_x3": 347.249, "r_y3": 474.477, "coord_origin": "TOPLEFT"}, "text": "13", "orig": "13", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 75, "label": "text", "bbox": {"l": 394.104, "t": 474.477, "r": 402.888, "b": 482.232, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 103, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.104, "r_y0": 482.232, "r_x1": 402.888, "r_y1": 482.232, "r_x2": 402.888, "r_y2": 474.477, "r_x3": 394.104, "r_y3": 474.477, "coord_origin": "TOPLEFT"}, "text": "14", "orig": "14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 76, "label": "text", "bbox": {"l": 440.959, "t": 474.477, "r": 449.743, "b": 482.232, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 104, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 440.959, "r_y0": 482.232, "r_x1": 449.743, "r_y1": 482.232, "r_x2": 449.743, "r_y2": 474.477, "r_x3": 440.959, "r_y3": 474.477, "coord_origin": "TOPLEFT"}, "text": "15", "orig": "15", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 77, "label": "text", "bbox": {"l": 487.815, "t": 474.477, "r": 496.599, "b": 482.232, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 105, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 487.815, "r_y0": 482.232, "r_x1": 496.599, "r_y1": 482.232, "r_x2": 496.599, "r_y2": 474.477, "r_x3": 487.815, "r_y3": 474.477, "coord_origin": "TOPLEFT"}, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 78, "label": "text", "bbox": {"l": 347.249, "t": 485.898, "r": 356.033, "b": 493.652, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 106, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 347.249, "r_y0": 493.652, "r_x1": 356.033, "r_y1": 493.652, "r_x2": 356.033, "r_y2": 485.898, "r_x3": 347.249, "r_y3": 485.898, "coord_origin": "TOPLEFT"}, "text": "17", "orig": "17", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 79, "label": "text", "bbox": {"l": 394.104, "t": 485.898, "r": 402.888, "b": 493.652, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 107, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.104, "r_y0": 493.652, "r_x1": 402.888, "r_y1": 493.652, "r_x2": 402.888, "r_y2": 485.898, "r_x3": 394.104, "r_y3": 485.898, "coord_origin": "TOPLEFT"}, "text": "18", "orig": "18", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 80, "label": "text", "bbox": {"l": 440.959, "t": 485.898, "r": 449.743, "b": 493.652, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 108, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 440.959, "r_y0": 493.652, "r_x1": 449.743, "r_y1": 493.652, "r_x2": 449.743, "r_y2": 485.898, "r_x3": 440.959, "r_y3": 485.898, "coord_origin": "TOPLEFT"}, "text": "19", "orig": "19", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 81, "label": "text", "bbox": {"l": 487.815, "t": 485.898, "r": 496.599, "b": 493.652, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 109, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 487.815, "r_y0": 493.652, "r_x1": 496.599, "r_y1": 493.652, "r_x2": 496.599, "r_y2": 485.898, "r_x3": 487.815, "r_y3": 485.898, "coord_origin": "TOPLEFT"}, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 84, "label": "text", "bbox": {"l": 366.701, "t": 449.25, "r": 372.706, "b": 459.214, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 112, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 366.701, "r_y0": 459.214, "r_x1": 372.706, "r_y1": 459.214, "r_x2": 372.706, "r_y2": 449.25, "r_x3": 366.701, "r_y3": 449.25, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 87, "label": "text", "bbox": {"l": 331.904, "t": 473.452, "r": 337.909, "b": 483.416, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 115, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 331.904, "r_y0": 483.416, "r_x1": 337.909, "r_y1": 483.416, "r_x2": 337.909, "r_y2": 473.452, "r_x3": 331.904, "r_y3": 473.452, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 89, "label": "text", "bbox": {"l": 459.876, "t": 437.723, "r": 465.881, "b": 447.687, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 117, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 459.876, "r_y0": 447.687, "r_x1": 465.881, "r_y1": 447.687, "r_x2": 465.881, "r_y2": 437.723, "r_x3": 459.876, "r_y3": 437.723, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}]}, "text": null, "otsl_seq": ["fcel", "fcel", "lcel", "lcel", "lcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 5, "num_cols": 5, "table_cells": [{"bbox": {"l": 347.249, "t": 437.723, "r": 465.881, "b": 447.687, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 4, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 1, "end_col_offset_idx": 5, "text": "1 2 1", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 318.881, "t": 438.459, "r": 323.273, "b": 446.213, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "0", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 318.773, "t": 450.319, "r": 323.166, "b": 458.073, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "3", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 347.249, "t": 449.25, "r": 372.706, "b": 459.214, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "4 3", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 394.104, "t": 450.319, "r": 398.497, "b": 458.073, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "5", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 440.959, "t": 450.319, "r": 445.352, "b": 458.073, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "6", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 487.815, "t": 450.319, "r": 492.207, "b": 458.073, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "7", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 318.773, "t": 473.452, "r": 337.909, "b": 483.416, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "8 2", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 347.249, "t": 462.618, "r": 351.641, "b": 470.372, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "9", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 394.104, "t": 462.618, "r": 402.888, "b": 470.372, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "10", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 440.959, "t": 462.618, "r": 449.423, "b": 470.372, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "11", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 487.815, "t": 462.618, "r": 496.599, "b": 470.372, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "12", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 347.249, "t": 474.477, "r": 356.033, "b": 482.232, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "13", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 394.104, "t": 474.477, "r": 402.888, "b": 482.232, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "14", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 440.959, "t": 474.477, "r": 449.743, "b": 482.232, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "15", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 487.815, "t": 474.477, "r": 496.599, "b": 482.232, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "16", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 347.249, "t": 485.898, "r": 356.033, "b": 493.652, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "17", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 394.104, "t": 485.898, "r": 402.888, "b": 493.652, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "18", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 440.959, "t": 485.898, "r": 449.743, "b": 493.652, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "19", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 487.815, "t": 485.898, "r": 496.599, "b": 493.652, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "20", "column_header": false, "row_header": false, "row_section": false}]}, {"label": "picture", "id": 16, "page_no": 0, "cluster": {"id": 16, "label": "picture", "bbox": {"l": 315.65362548828125, "t": 228.723388671875, "r": 537.1475219726562, "b": 302.8014221191406, "coord_origin": "TOPLEFT"}, "confidence": 0.608779788017273, "cells": [{"index": 110, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 451.946, "r_y0": 245.44000000000005, "r_x1": 457.951, "r_y1": 245.44000000000005, "r_x2": 457.951, "r_y2": 235.47699999999998, "r_x3": 451.946, "r_y3": 235.47699999999998, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 113, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 331.197, "r_y0": 279.446, "r_x1": 337.202, "r_y1": 279.446, "r_x2": 337.202, "r_y2": 269.48199999999997, "r_x3": 331.197, "r_y3": 269.48199999999997, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 118, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 384.033, "r_y0": 262.77200000000005, "r_x1": 390.038, "r_y1": 262.77200000000005, "r_x2": 390.038, "r_y2": 252.80899999999997, "r_x3": 384.033, "r_y3": 252.80899999999997, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": [{"id": 82, "label": "text", "bbox": {"l": 451.946, "t": 235.47699999999998, "r": 457.951, "b": 245.44000000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 110, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 451.946, "r_y0": 245.44000000000005, "r_x1": 457.951, "r_y1": 245.44000000000005, "r_x2": 457.951, "r_y2": 235.47699999999998, "r_x3": 451.946, "r_y3": 235.47699999999998, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 85, "label": "text", "bbox": {"l": 331.197, "t": 269.48199999999997, "r": 337.202, "b": 279.446, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 113, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 331.197, "r_y0": 279.446, "r_x1": 337.202, "r_y1": 279.446, "r_x2": 337.202, "r_y2": 269.48199999999997, "r_x3": 331.197, "r_y3": 269.48199999999997, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 90, "label": "text", "bbox": {"l": 384.033, "t": 252.80899999999997, "r": 390.038, "b": 262.77200000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 118, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 384.033, "r_y0": 262.77200000000005, "r_x1": 390.038, "r_y1": 262.77200000000005, "r_x2": 390.038, "r_y2": 252.80899999999997, "r_x3": 384.033, "r_y3": 252.80899999999997, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}]}, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null}, {"label": "table", "id": 15, "page_no": 0, "cluster": {"id": 15, "label": "table", "bbox": {"l": 315.65362548828125, "t": 228.723388671875, "r": 537.1475219726562, "b": 302.8014221191406, "coord_origin": "TOPLEFT"}, "confidence": 0.6515864729881287, "cells": [{"index": 110, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 451.946, "r_y0": 245.44000000000005, "r_x1": 457.951, "r_y1": 245.44000000000005, "r_x2": 457.951, "r_y2": 235.47699999999998, "r_x3": 451.946, "r_y3": 235.47699999999998, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 113, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 331.197, "r_y0": 279.446, "r_x1": 337.202, "r_y1": 279.446, "r_x2": 337.202, "r_y2": 269.48199999999997, "r_x3": 331.197, "r_y3": 269.48199999999997, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 118, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 384.033, "r_y0": 262.77200000000005, "r_x1": 390.038, "r_y1": 262.77200000000005, "r_x2": 390.038, "r_y2": 252.80899999999997, "r_x3": 384.033, "r_y3": 252.80899999999997, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": [{"id": 82, "label": "text", "bbox": {"l": 451.946, "t": 235.47699999999998, "r": 457.951, "b": 245.44000000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 110, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 451.946, "r_y0": 245.44000000000005, "r_x1": 457.951, "r_y1": 245.44000000000005, "r_x2": 457.951, "r_y2": 235.47699999999998, "r_x3": 451.946, "r_y3": 235.47699999999998, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 85, "label": "text", "bbox": {"l": 331.197, "t": 269.48199999999997, "r": 337.202, "b": 279.446, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 113, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 331.197, "r_y0": 279.446, "r_x1": 337.202, "r_y1": 279.446, "r_x2": 337.202, "r_y2": 269.48199999999997, "r_x3": 331.197, "r_y3": 269.48199999999997, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 90, "label": "text", "bbox": {"l": 384.033, "t": 252.80899999999997, "r": 390.038, "b": 262.77200000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 118, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 384.033, "r_y0": 262.77200000000005, "r_x1": 390.038, "r_y1": 262.77200000000005, "r_x2": 390.038, "r_y2": 252.80899999999997, "r_x3": 384.033, "r_y3": 252.80899999999997, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}]}, "text": null, "otsl_seq": ["ecel", "ched", "ched", "ched", "ched", "nl", "rhed", "rhed", "fcel", "fcel", "fcel", "nl", "ucel", "rhed", "fcel", "fcel", "fcel", "nl", "ucel", "rhed", "fcel", "fcel", "fcel", "nl"], "num_rows": 1, "num_cols": 1, "table_cells": [{"bbox": {"l": 451.946, "t": 235.47699999999998, "r": 457.951, "b": 245.44000000000005, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "1", "column_header": true, "row_header": false, "row_section": false}]}, {"label": "caption", "id": 6, "page_no": 0, "cluster": {"id": 6, "label": "caption", "bbox": {"l": 308.862, "t": 514.769, "r": 545.115, "b": 559.187, "coord_origin": "TOPLEFT"}, "confidence": 0.9214619398117065, "cells": [{"index": 119, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 523.321, "r_x1": 345.734, "r_y1": 523.321, "r_x2": 345.734, "r_y2": 514.769, "r_x3": 308.862, "r_y3": 514.769, "coord_origin": "TOPLEFT"}, "text": "Figure 1:", "orig": "Figure 1:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 120, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 353.176, "r_y0": 523.321, "r_x1": 545.115, "r_y1": 523.321, "r_x2": 545.115, "r_y2": 514.769, "r_x3": 353.176, "r_y3": 514.769, "coord_origin": "TOPLEFT"}, "text": "Picture of a table with subtle, complex features", "orig": "Picture of a table with subtle, complex features", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 121, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 535.2760000000001, "r_x1": 545.115, "r_y1": 535.2760000000001, "r_x2": 545.115, "r_y2": 526.7239999999999, "r_x3": 308.862, "r_y3": 526.7239999999999, "coord_origin": "TOPLEFT"}, "text": "such as (1) multi-column headers, (2) cell with multi-row", "orig": "such as (1) multi-column headers, (2) cell with multi-row", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 122, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 547.231, "r_x1": 445.539, "r_y1": 547.231, "r_x2": 445.539, "r_y2": 538.679, "r_x3": 308.862, "r_y3": 538.679, "coord_origin": "TOPLEFT"}, "text": "text and (3) cells with no content.", "orig": "text and (3) cells with no content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 123, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 450.221, "r_y0": 547.231, "r_x1": 545.115, "r_y1": 547.231, "r_x2": 545.115, "r_y2": 538.679, "r_x3": 450.221, "r_y3": 538.679, "coord_origin": "TOPLEFT"}, "text": "Image from PubTabNet", "orig": "Image from PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 124, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 559.187, "r_x1": 505.692, "r_y1": 559.187, "r_x2": 505.692, "r_y2": 550.635, "r_x3": 308.862, "r_y3": 550.635, "coord_origin": "TOPLEFT"}, "text": "evaluation set, filename: 'PMC2944238 004 02'.", "orig": "evaluation set, filename: 'PMC2944238 004 02'.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Figure 1: Picture of a table with subtle, complex features such as (1) multi-column headers, (2) cell with multi-row text and (3) cells with no content. Image from PubTabNet evaluation set, filename: 'PMC2944238 004 02'."}, {"label": "text", "id": 0, "page_no": 0, "cluster": {"id": 0, "label": "text", "bbox": {"l": 308.862, "t": 584.678, "r": 545.115, "b": 664.961, "coord_origin": "TOPLEFT"}, "confidence": 0.9848759770393372, "cells": [{"index": 125, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 593.23, "r_x1": 358.077, "r_y1": 593.23, "r_x2": 358.077, "r_y2": 584.678, "r_x3": 320.817, "r_y3": 584.678, "coord_origin": "TOPLEFT"}, "text": "Recently,", "orig": "Recently,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 126, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 362.62, "r_y0": 593.23, "r_x1": 404.134, "r_y1": 593.23, "r_x2": 404.134, "r_y2": 584.678, "r_x3": 362.62, "r_y3": 584.678, "coord_origin": "TOPLEFT"}, "text": "significant", "orig": "significant", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 127, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 408.259, "r_y0": 593.23, "r_x1": 545.115, "r_y1": 593.23, "r_x2": 545.115, "r_y2": 584.678, "r_x3": 408.259, "r_y3": 584.678, "coord_origin": "TOPLEFT"}, "text": "progress has been made with vi-", "orig": "progress has been made with vi-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 128, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 605.185, "r_x1": 526.365, "r_y1": 605.185, "r_x2": 526.365, "r_y2": 596.633, "r_x3": 308.862, "r_y3": 596.633, "coord_origin": "TOPLEFT"}, "text": "sion based approaches to extract tables in documents.", "orig": "sion based approaches to extract tables in documents.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 129, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 531.426, "r_y0": 605.185, "r_x1": 545.115, "r_y1": 605.185, "r_x2": 545.115, "r_y2": 596.633, "r_x3": 531.426, "r_y3": 596.633, "coord_origin": "TOPLEFT"}, "text": "For", "orig": "For", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 130, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 617.14, "r_x1": 545.115, "r_y1": 617.14, "r_x2": 545.115, "r_y2": 608.588, "r_x3": 308.862, "r_y3": 608.588, "coord_origin": "TOPLEFT"}, "text": "the sake of completeness, the issue of table extraction from", "orig": "the sake of completeness, the issue of table extraction from", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 131, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 629.095, "r_x1": 545.115, "r_y1": 629.095, "r_x2": 545.115, "r_y2": 620.543, "r_x3": 308.862, "r_y3": 620.543, "coord_origin": "TOPLEFT"}, "text": "documents is typically decomposed into two separate chal-", "orig": "documents is typically decomposed into two separate chal-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 132, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 641.0509999999999, "r_x1": 336.807, "r_y1": 641.0509999999999, "r_x2": 336.807, "r_y2": 632.499, "r_x3": 308.862, "r_y3": 632.499, "coord_origin": "TOPLEFT"}, "text": "lenges,", "orig": "lenges,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 133, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 341.519, "r_y0": 641.0509999999999, "r_x1": 353.694, "r_y1": 641.0509999999999, "r_x2": 353.694, "r_y2": 632.499, "r_x3": 341.519, "r_y3": 632.499, "coord_origin": "TOPLEFT"}, "text": "i.e.", "orig": "i.e.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 134, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 362.112, "r_y0": 641.0509999999999, "r_x1": 373.728, "r_y1": 641.0509999999999, "r_x2": 373.728, "r_y2": 632.499, "r_x3": 362.112, "r_y3": 632.499, "coord_origin": "TOPLEFT"}, "text": "(1)", "orig": "(1)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 135, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 377.992, "r_y0": 641.0509999999999, "r_x1": 406.226, "r_y1": 641.0509999999999, "r_x2": 406.226, "r_y2": 632.499, "r_x3": 377.992, "r_y3": 632.499, "coord_origin": "TOPLEFT"}, "text": "finding", "orig": "finding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 136, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 410.5, "r_y0": 641.0509999999999, "r_x1": 422.675, "r_y1": 641.0509999999999, "r_x2": 422.675, "r_y2": 632.499, "r_x3": 410.5, "r_y3": 632.499, "coord_origin": "TOPLEFT"}, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 137, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 426.939, "r_y0": 641.0509999999999, "r_x1": 459.038, "r_y1": 641.0509999999999, "r_x2": 459.038, "r_y2": 632.499, "r_x3": 426.939, "r_y3": 632.499, "coord_origin": "TOPLEFT"}, "text": "location", "orig": "location", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 138, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 463.302, "r_y0": 641.0509999999999, "r_x1": 471.601, "r_y1": 641.0509999999999, "r_x2": 471.601, "r_y2": 632.499, "r_x3": 463.302, "r_y3": 632.499, "coord_origin": "TOPLEFT"}, "text": "of", "orig": "of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 139, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 475.875, "r_y0": 641.0509999999999, "r_x1": 488.049, "r_y1": 641.0509999999999, "r_x2": 488.049, "r_y2": 632.499, "r_x3": 475.875, "r_y3": 632.499, "coord_origin": "TOPLEFT"}, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 140, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 492.313, "r_y0": 641.0509999999999, "r_x1": 522.191, "r_y1": 641.0509999999999, "r_x2": 522.191, "r_y2": 632.499, "r_x3": 492.313, "r_y3": 632.499, "coord_origin": "TOPLEFT"}, "text": "table(s)", "orig": "table(s)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 141, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 526.455, "r_y0": 641.0509999999999, "r_x1": 545.115, "r_y1": 641.0509999999999, "r_x2": 545.115, "r_y2": 632.499, "r_x3": 526.455, "r_y3": 632.499, "coord_origin": "TOPLEFT"}, "text": "on a", "orig": "on a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 142, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 653.006, "r_x1": 545.115, "r_y1": 653.006, "r_x2": 545.115, "r_y2": 644.454, "r_x3": 308.862, "r_y3": 644.454, "coord_origin": "TOPLEFT"}, "text": "document-page and (2) finding the structure of a given table", "orig": "document-page and (2) finding the structure of a given table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 143, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 664.961, "r_x1": 375.552, "r_y1": 664.961, "r_x2": 375.552, "r_y2": 656.409, "r_x3": 308.862, "r_y3": 656.409, "coord_origin": "TOPLEFT"}, "text": "in the document.", "orig": "in the document.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Recently, significant progress has been made with vision based approaches to extract tables in documents. For the sake of completeness, the issue of table extraction from documents is typically decomposed into two separate challenges, i.e. (1) finding the location of the table(s) on a document-page and (2) finding the structure of a given table in the document."}, {"label": "text", "id": 3, "page_no": 0, "cluster": {"id": 3, "label": "text", "bbox": {"l": 308.862, "t": 668.649, "r": 545.115, "b": 713.066, "coord_origin": "TOPLEFT"}, "confidence": 0.979152262210846, "cells": [{"index": 144, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 677.201, "r_x1": 545.115, "r_y1": 677.201, "r_x2": 545.115, "r_y2": 668.649, "r_x3": 320.817, "r_y3": 668.649, "coord_origin": "TOPLEFT"}, "text": "The first problem is called table-location and has been", "orig": "The first problem is called table-location and has been", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 145, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 689.156, "r_x1": 545.115, "r_y1": 689.156, "r_x2": 545.115, "r_y2": 680.604, "r_x3": 308.862, "r_y3": 680.604, "coord_origin": "TOPLEFT"}, "text": "previously addressed [30, 38, 19, 21, 23, 26, 8] with state-", "orig": "previously addressed [30, 38, 19, 21, 23, 26, 8] with state-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 146, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 701.111, "r_x1": 474.261, "r_y1": 701.111, "r_x2": 474.261, "r_y2": 692.559, "r_x3": 308.862, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "of-the-art object-detection networks (e.g.", "orig": "of-the-art object-detection networks (e.g.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 147, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 479.342, "r_y0": 701.111, "r_x1": 545.115, "r_y1": 701.111, "r_x2": 545.115, "r_y2": 692.559, "r_x3": 479.342, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "YOLO and later", "orig": "YOLO and later", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 148, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 713.066, "r_x1": 395.796, "r_y1": 713.066, "r_x2": 395.796, "r_y2": 704.514, "r_x3": 308.862, "r_y3": 704.514, "coord_origin": "TOPLEFT"}, "text": "on Mask-RCNN [9]).", "orig": "on Mask-RCNN [9]).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 149, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 401.046, "r_y0": 713.066, "r_x1": 545.115, "r_y1": 713.066, "r_x2": 545.115, "r_y2": 704.514, "r_x3": 401.046, "r_y3": 704.514, "coord_origin": "TOPLEFT"}, "text": "For all practical purposes, it can be", "orig": "For all practical purposes, it can be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "The first problem is called table-location and has been previously addressed [30, 38, 19, 21, 23, 26, 8] with stateof-the-art object-detection networks (e.g. YOLO and later on Mask-RCNN [9]). For all practical purposes, it can be"}, {"label": "text", "id": 91, "page_no": 0, "cluster": {"id": 91, "label": "text", "bbox": {"l": 18.34, "t": 160.0, "r": 36.34, "b": 200.0, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 155, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 36.34, "r_y0": 200.0, "r_x1": 36.34, "r_y1": 160.0, "r_x2": 18.34, "r_y2": 160.0, "r_x3": 18.34, "r_y3": 200.0, "coord_origin": "TOPLEFT"}, "text": "2022", "orig": "2022", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "2022"}], "headers": [{"label": "page_footer", "id": 12, "page_no": 0, "cluster": {"id": 12, "label": "page_footer", "bbox": {"l": 295.121, "t": 734.402, "r": 300.102, "b": 742.954, "coord_origin": "TOPLEFT"}, "confidence": 0.8045893311500549, "cells": [{"index": 150, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 295.121, "r_y0": 742.954, "r_x1": 300.102, "r_y1": 742.954, "r_x2": 300.102, "r_y2": 734.402, "r_x3": 295.121, "r_y3": 734.402, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "1"}, {"label": "page_header", "id": 9, "page_no": 0, "cluster": {"id": 9, "label": "page_header", "bbox": {"l": 18.34, "t": 210.0, "r": 36.34, "b": 560.0, "coord_origin": "TOPLEFT"}, "confidence": 0.8773143887519836, "cells": [{"index": 151, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 36.34, "r_y0": 560.0, "r_x1": 36.34, "r_y1": 380.0, "r_x2": 18.34, "r_y2": 380.0, "r_x3": 18.34, "r_y3": 560.0, "coord_origin": "TOPLEFT"}, "text": "arXiv:2203.01017v2", "orig": "arXiv:2203.01017v2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 152, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 36.34, "r_y0": 360.0, "r_x1": 36.34, "r_y1": 290.0, "r_x2": 18.34, "r_y2": 290.0, "r_x3": 18.34, "r_y3": 360.0, "coord_origin": "TOPLEFT"}, "text": "[cs.CV]", "orig": "[cs.CV]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 153, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 36.34, "r_y0": 270.0, "r_x1": 36.34, "r_y1": 250.0, "r_x2": 18.34, "r_y2": 250.0, "r_x3": 18.34, "r_y3": 270.0, "coord_origin": "TOPLEFT"}, "text": "11", "orig": "11", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 154, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 36.34, "r_y0": 240.0, "r_x1": 36.34, "r_y1": 210.0, "r_x2": 18.34, "r_y2": 210.0, "r_x3": 18.34, "r_y3": 240.0, "coord_origin": "TOPLEFT"}, "text": "Mar", "orig": "Mar", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "arXiv:2203.01017v2 [cs.CV] 11 Mar"}]}}, {"page_no": 1, "size": {"width": 612.0, "height": 792.0}, "cells": [{"index": 0, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 84.029, "r_x1": 286.365, "r_y1": 84.029, "r_x2": 286.365, "r_y2": 75.47699999999998, "r_x3": 50.112, "r_y3": 75.47699999999998, "coord_origin": "TOPLEFT"}, "text": "considered as a solved problem, given enough ground-truth", "orig": "considered as a solved problem, given enough ground-truth", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 95.98400000000004, "r_x1": 112.647, "r_y1": 95.98400000000004, "r_x2": 112.647, "r_y2": 87.43200000000002, "r_x3": 50.112, "r_y3": 87.43200000000002, "coord_origin": "TOPLEFT"}, "text": "data to train on.", "orig": "data to train on.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 108.39200000000005, "r_x1": 286.365, "r_y1": 108.39200000000005, "r_x2": 286.365, "r_y2": 99.84000000000003, "r_x3": 62.067, "r_y3": 99.84000000000003, "coord_origin": "TOPLEFT"}, "text": "The second problem is called table-structure decompo-", "orig": "The second problem is called table-structure decompo-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 120.34699999999998, "r_x1": 74.75, "r_y1": 120.34699999999998, "r_x2": 74.75, "r_y2": 111.79499999999996, "r_x3": 50.112, "r_y3": 111.79499999999996, "coord_origin": "TOPLEFT"}, "text": "sition.", "orig": "sition.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 81.335, "r_y0": 120.34699999999998, "r_x1": 286.365, "r_y1": 120.34699999999998, "r_x2": 286.365, "r_y2": 111.79499999999996, "r_x3": 81.335, "r_y3": 111.79499999999996, "coord_origin": "TOPLEFT"}, "text": "The latter is a long standing problem in the com-", "orig": "The latter is a long standing problem in the com-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 132.30200000000002, "r_x1": 235.117, "r_y1": 132.30200000000002, "r_x2": 235.117, "r_y2": 123.75, "r_x3": 50.112, "r_y3": 123.75, "coord_origin": "TOPLEFT"}, "text": "munity of document understanding [6, 4, 14].", "orig": "munity of document understanding [6, 4, 14].", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 240.079, "r_y0": 132.30200000000002, "r_x1": 286.365, "r_y1": 132.30200000000002, "r_x2": 286.365, "r_y2": 123.75, "r_x3": 240.079, "r_y3": 123.75, "coord_origin": "TOPLEFT"}, "text": "Contrary to", "orig": "Contrary to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 144.25699999999995, "r_x1": 286.365, "r_y1": 144.25699999999995, "r_x2": 286.365, "r_y2": 135.70500000000004, "r_x3": 50.112, "r_y3": 135.70500000000004, "coord_origin": "TOPLEFT"}, "text": "the table-location problem, there are no commonly used ap-", "orig": "the table-location problem, there are no commonly used ap-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 156.21299999999997, "r_x1": 286.365, "r_y1": 156.21299999999997, "r_x2": 286.365, "r_y2": 147.66099999999994, "r_x3": 50.112, "r_y3": 147.66099999999994, "coord_origin": "TOPLEFT"}, "text": "proaches that can easily be re-purposed to solve this prob-", "orig": "proaches that can easily be re-purposed to solve this prob-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 168.168, "r_x1": 286.365, "r_y1": 168.168, "r_x2": 286.365, "r_y2": 159.61599999999999, "r_x3": 50.112, "r_y3": 159.61599999999999, "coord_origin": "TOPLEFT"}, "text": "lem. Lately, a set of new model-architectures has been pro-", "orig": "lem. Lately, a set of new model-architectures has been pro-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 180.12300000000005, "r_x1": 286.365, "r_y1": 180.12300000000005, "r_x2": 286.365, "r_y2": 171.57100000000003, "r_x3": 50.112, "r_y3": 171.57100000000003, "coord_origin": "TOPLEFT"}, "text": "posed by the community to address table-structure decom-", "orig": "posed by the community to address table-structure decom-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 192.07799999999997, "r_x1": 286.365, "r_y1": 192.07799999999997, "r_x2": 286.365, "r_y2": 183.52599999999995, "r_x3": 50.112, "r_y3": 183.52599999999995, "coord_origin": "TOPLEFT"}, "text": "position [37, 36, 18, 20]. All these models have some weak-", "orig": "position [37, 36, 18, 20]. All these models have some weak-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 204.03300000000002, "r_x1": 114.51, "r_y1": 204.03300000000002, "r_x2": 114.51, "r_y2": 195.481, "r_x3": 50.112, "r_y3": 195.481, "coord_origin": "TOPLEFT"}, "text": "nesses (see Sec.", "orig": "nesses (see Sec.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 119.163, "r_y0": 204.03300000000002, "r_x1": 129.952, "r_y1": 204.03300000000002, "r_x2": 129.952, "r_y2": 195.481, "r_x3": 119.163, "r_y3": 195.481, "coord_origin": "TOPLEFT"}, "text": "2).", "orig": "2).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.615, "r_y0": 204.03300000000002, "r_x1": 286.365, "r_y1": 204.03300000000002, "r_x2": 286.365, "r_y2": 195.481, "r_x3": 134.615, "r_y3": 195.481, "coord_origin": "TOPLEFT"}, "text": "The common denominator here is the", "orig": "The common denominator here is the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 215.98800000000006, "r_x1": 286.365, "r_y1": 215.98800000000006, "r_x2": 286.365, "r_y2": 207.43600000000004, "r_x3": 50.112, "r_y3": 207.43600000000004, "coord_origin": "TOPLEFT"}, "text": "reliance on textual features and/or the inability to provide", "orig": "reliance on textual features and/or the inability to provide", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 227.94399999999996, "r_x1": 278.664, "r_y1": 227.94399999999996, "r_x2": 278.664, "r_y2": 219.39200000000005, "r_x3": 50.112, "r_y3": 219.39200000000005, "coord_origin": "TOPLEFT"}, "text": "the bounding box of each table-cell in the original image.", "orig": "the bounding box of each table-cell in the original image.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 240.35199999999998, "r_x1": 286.365, "r_y1": 240.35199999999998, "r_x2": 286.365, "r_y2": 231.79999999999995, "r_x3": 62.067, "r_y3": 231.79999999999995, "coord_origin": "TOPLEFT"}, "text": "In this paper, we want to address these weaknesses and", "orig": "In this paper, we want to address these weaknesses and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 252.30700000000002, "r_x1": 78.884, "r_y1": 252.30700000000002, "r_x2": 78.884, "r_y2": 243.755, "r_x3": 50.112, "r_y3": 243.755, "coord_origin": "TOPLEFT"}, "text": "present", "orig": "present", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 19, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 83.068, "r_y0": 252.30700000000002, "r_x1": 116.373, "r_y1": 252.30700000000002, "r_x2": 116.373, "r_y2": 243.755, "r_x3": 83.068, "r_y3": 243.755, "coord_origin": "TOPLEFT"}, "text": "a robust", "orig": "a robust", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 20, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 120.558, "r_y0": 252.30700000000002, "r_x1": 178.102, "r_y1": 252.30700000000002, "r_x2": 178.102, "r_y2": 243.755, "r_x3": 120.558, "r_y3": 243.755, "coord_origin": "TOPLEFT"}, "text": "table-structure", "orig": "table-structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 21, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 182.276, "r_y0": 252.30700000000002, "r_x1": 286.365, "r_y1": 252.30700000000002, "r_x2": 286.365, "r_y2": 243.755, "r_x3": 182.276, "r_y3": 243.755, "coord_origin": "TOPLEFT"}, "text": "decomposition algorithm.", "orig": "decomposition algorithm.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 22, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 264.26199999999994, "r_x1": 260.432, "r_y1": 264.26199999999994, "r_x2": 260.432, "r_y2": 255.71000000000004, "r_x3": 50.112, "r_y3": 255.71000000000004, "coord_origin": "TOPLEFT"}, "text": "The design criteria for our model are the following.", "orig": "The design criteria for our model are the following.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 23, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 265.603, "r_y0": 264.26199999999994, "r_x1": 286.365, "r_y1": 264.26199999999994, "r_x2": 286.365, "r_y2": 255.71000000000004, "r_x3": 265.603, "r_y3": 255.71000000000004, "coord_origin": "TOPLEFT"}, "text": "First,", "orig": "First,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 24, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 276.217, "r_x1": 286.365, "r_y1": 276.217, "r_x2": 286.365, "r_y2": 267.66499999999996, "r_x3": 50.112, "r_y3": 267.66499999999996, "coord_origin": "TOPLEFT"}, "text": "we want our algorithm to be language agnostic. In this way,", "orig": "we want our algorithm to be language agnostic. In this way,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 25, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 288.172, "r_x1": 286.365, "r_y1": 288.172, "r_x2": 286.365, "r_y2": 279.62, "r_x3": 50.112, "r_y3": 279.62, "coord_origin": "TOPLEFT"}, "text": "we can obtain the structure of any table, irregardless of the", "orig": "we can obtain the structure of any table, irregardless of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 26, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 300.128, "r_x1": 88.568, "r_y1": 300.128, "r_x2": 88.568, "r_y2": 291.576, "r_x3": 50.112, "r_y3": 291.576, "coord_origin": "TOPLEFT"}, "text": "language.", "orig": "language.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 27, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 95.502, "r_y0": 300.128, "r_x1": 286.365, "r_y1": 300.128, "r_x2": 286.365, "r_y2": 291.576, "r_x3": 95.502, "r_y3": 291.576, "coord_origin": "TOPLEFT"}, "text": "Second, we want our algorithm to leverage as", "orig": "Second, we want our algorithm to leverage as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 28, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 312.083, "r_x1": 286.365, "r_y1": 312.083, "r_x2": 286.365, "r_y2": 303.531, "r_x3": 50.112, "r_y3": 303.531, "coord_origin": "TOPLEFT"}, "text": "much data as possible from the original PDF document. For", "orig": "much data as possible from the original PDF document. For", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 29, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 324.038, "r_x1": 286.365, "r_y1": 324.038, "r_x2": 286.365, "r_y2": 315.486, "r_x3": 50.112, "r_y3": 315.486, "coord_origin": "TOPLEFT"}, "text": "programmatic PDF documents, the text-cells can often be", "orig": "programmatic PDF documents, the text-cells can often be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 30, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 335.993, "r_x1": 286.365, "r_y1": 335.993, "r_x2": 286.365, "r_y2": 327.441, "r_x3": 50.112, "r_y3": 327.441, "coord_origin": "TOPLEFT"}, "text": "extracted much faster and with higher accuracy compared", "orig": "extracted much faster and with higher accuracy compared", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 347.948, "r_x1": 286.365, "r_y1": 347.948, "r_x2": 286.365, "r_y2": 339.396, "r_x3": 50.112, "r_y3": 339.396, "coord_origin": "TOPLEFT"}, "text": "to OCR methods. Last but not least, we want to have a di-", "orig": "to OCR methods. Last but not least, we want to have a di-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 359.904, "r_x1": 286.365, "r_y1": 359.904, "r_x2": 286.365, "r_y2": 351.352, "r_x3": 50.112, "r_y3": 351.352, "coord_origin": "TOPLEFT"}, "text": "rect link between the table-cell and its bounding box in the", "orig": "rect link between the table-cell and its bounding box in the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 371.859, "r_x1": 76.951, "r_y1": 371.859, "r_x2": 76.951, "r_y2": 363.307, "r_x3": 50.112, "r_y3": 363.307, "coord_origin": "TOPLEFT"}, "text": "image.", "orig": "image.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 384.267, "r_x1": 286.365, "r_y1": 384.267, "r_x2": 286.365, "r_y2": 375.715, "r_x3": 62.067, "r_y3": 375.715, "coord_origin": "TOPLEFT"}, "text": "To meet the design criteria listed above, we developed a", "orig": "To meet the design criteria listed above, we developed a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 396.222, "r_x1": 120.986, "r_y1": 396.222, "r_x2": 120.986, "r_y2": 387.67, "r_x3": 50.112, "r_y3": 387.67, "coord_origin": "TOPLEFT"}, "text": "new model called", "orig": "new model called", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 123.901, "r_y0": 396.238, "r_x1": 179.731, "r_y1": 396.238, "r_x2": 179.731, "r_y2": 387.282, "r_x3": 123.901, "r_y3": 387.282, "coord_origin": "TOPLEFT"}, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 182.646, "r_y0": 396.222, "r_x1": 286.367, "r_y1": 396.222, "r_x2": 286.367, "r_y2": 387.67, "r_x3": 182.646, "r_y3": 387.67, "coord_origin": "TOPLEFT"}, "text": "and a synthetically gener-", "orig": "and a synthetically gener-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 408.177, "r_x1": 181.758, "r_y1": 408.177, "r_x2": 181.758, "r_y2": 399.625, "r_x3": 50.112, "r_y3": 399.625, "coord_origin": "TOPLEFT"}, "text": "ated table structure dataset called", "orig": "ated table structure dataset called", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 184.104, "r_y0": 408.193, "r_x1": 240.203, "r_y1": 408.193, "r_x2": 240.203, "r_y2": 399.237, "r_x3": 184.104, "r_y3": 399.237, "coord_origin": "TOPLEFT"}, "text": "SynthTabNet", "orig": "SynthTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 240.204, "r_y0": 403.942, "r_x1": 243.691, "r_y1": 403.942, "r_x2": 243.691, "r_y2": 397.956, "r_x3": 240.204, "r_y3": 397.956, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 244.189, "r_y0": 408.177, "r_x1": 246.68, "r_y1": 408.177, "r_x2": 246.68, "r_y2": 399.625, "r_x3": 244.189, "r_y3": 399.625, "coord_origin": "TOPLEFT"}, "text": ".", "orig": ".", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 249.718, "r_y0": 408.177, "r_x1": 286.361, "r_y1": 408.177, "r_x2": 286.361, "r_y2": 399.625, "r_x3": 249.718, "r_y3": 399.625, "coord_origin": "TOPLEFT"}, "text": "In partic-", "orig": "In partic-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 420.132, "r_x1": 67.696, "r_y1": 420.132, "r_x2": 67.696, "r_y2": 411.58, "r_x3": 50.112, "r_y3": 411.58, "coord_origin": "TOPLEFT"}, "text": "ular,", "orig": "ular,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 71.322, "r_y0": 420.132, "r_x1": 286.365, "r_y1": 420.132, "r_x2": 286.365, "r_y2": 411.58, "r_x3": 71.322, "r_y3": 411.58, "coord_origin": "TOPLEFT"}, "text": "our contributions in this work can be summarised as", "orig": "our contributions in this work can be summarised as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 432.087, "r_x1": 82.52, "r_y1": 432.087, "r_x2": 82.52, "r_y2": 423.535, "r_x3": 50.112, "r_y3": 423.535, "coord_origin": "TOPLEFT"}, "text": "follows:", "orig": "follows:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 61.569, "r_y0": 453.372, "r_x1": 65.056, "r_y1": 453.372, "r_x2": 65.056, "r_y2": 444.82, "r_x3": 61.569, "r_y3": 444.82, "coord_origin": "TOPLEFT"}, "text": "\u2022", "orig": "\u2022", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.037, "r_y0": 453.372, "r_x1": 117.101, "r_y1": 453.372, "r_x2": 117.101, "r_y2": 444.82, "r_x3": 70.037, "r_y3": 444.82, "coord_origin": "TOPLEFT"}, "text": "We propose", "orig": "We propose", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 48, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 119.59, "r_y0": 453.388, "r_x1": 175.42, "r_y1": 453.388, "r_x2": 175.42, "r_y2": 444.432, "r_x3": 119.59, "r_y3": 444.432, "coord_origin": "TOPLEFT"}, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 49, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 175.421, "r_y0": 453.372, "r_x1": 286.365, "r_y1": 453.372, "r_x2": 286.365, "r_y2": 444.82, "r_x3": 175.421, "r_y3": 444.82, "coord_origin": "TOPLEFT"}, "text": ", a transformer based model", "orig": ", a transformer based model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 50, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.037, "r_y0": 465.327, "r_x1": 286.365, "r_y1": 465.327, "r_x2": 286.365, "r_y2": 456.775, "r_x3": 70.037, "r_y3": 456.775, "coord_origin": "TOPLEFT"}, "text": "that predicts tables structure and bounding boxes for", "orig": "that predicts tables structure and bounding boxes for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 51, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.037, "r_y0": 477.282, "r_x1": 286.365, "r_y1": 477.282, "r_x2": 286.365, "r_y2": 468.73, "r_x3": 70.037, "r_y3": 468.73, "coord_origin": "TOPLEFT"}, "text": "the table content simultaneously in an end-to-end ap-", "orig": "the table content simultaneously in an end-to-end ap-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 52, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.037, "r_y0": 489.237, "r_x1": 99.636, "r_y1": 489.237, "r_x2": 99.636, "r_y2": 480.685, "r_x3": 70.037, "r_y3": 480.685, "coord_origin": "TOPLEFT"}, "text": "proach.", "orig": "proach.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 53, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 61.569, "r_y0": 510.974, "r_x1": 65.056, "r_y1": 510.974, "r_x2": 65.056, "r_y2": 502.422, "r_x3": 61.569, "r_y3": 502.422, "coord_origin": "TOPLEFT"}, "text": "\u2022", "orig": "\u2022", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 54, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.037, "r_y0": 510.974, "r_x1": 111.88, "r_y1": 510.974, "r_x2": 111.88, "r_y2": 502.422, "r_x3": 70.037, "r_y3": 502.422, "coord_origin": "TOPLEFT"}, "text": "Across all", "orig": "Across all", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 55, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 116.084, "r_y0": 510.974, "r_x1": 196.104, "r_y1": 510.974, "r_x2": 196.104, "r_y2": 502.422, "r_x3": 116.084, "r_y3": 502.422, "coord_origin": "TOPLEFT"}, "text": "benchmark datasets", "orig": "benchmark datasets", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 56, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 200.31, "r_y0": 510.99, "r_x1": 256.14, "r_y1": 510.99, "r_x2": 256.14, "r_y2": 502.034, "r_x3": 200.31, "r_y3": 502.034, "coord_origin": "TOPLEFT"}, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 57, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 260.35, "r_y0": 510.974, "r_x1": 286.362, "r_y1": 510.974, "r_x2": 286.362, "r_y2": 502.422, "r_x3": 260.35, "r_y3": 502.422, "coord_origin": "TOPLEFT"}, "text": "signif-", "orig": "signif-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 58, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.037, "r_y0": 522.929, "r_x1": 97.155, "r_y1": 522.929, "r_x2": 97.155, "r_y2": 514.377, "r_x3": 70.037, "r_y3": 514.377, "coord_origin": "TOPLEFT"}, "text": "icantly", "orig": "icantly", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 59, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 101.678, "r_y0": 522.929, "r_x1": 150.375, "r_y1": 522.929, "r_x2": 150.375, "r_y2": 514.377, "r_x3": 101.678, "r_y3": 514.377, "coord_origin": "TOPLEFT"}, "text": "outperforms", "orig": "outperforms", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 60, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 154.898, "r_y0": 522.929, "r_x1": 186.301, "r_y1": 522.929, "r_x2": 186.301, "r_y2": 514.377, "r_x3": 154.898, "r_y3": 514.377, "coord_origin": "TOPLEFT"}, "text": "existing", "orig": "existing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 61, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 190.824, "r_y0": 522.929, "r_x1": 250.021, "r_y1": 522.929, "r_x2": 250.021, "r_y2": 514.377, "r_x3": 190.824, "r_y3": 514.377, "coord_origin": "TOPLEFT"}, "text": "state-of-the-art", "orig": "state-of-the-art", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 62, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 254.544, "r_y0": 522.929, "r_x1": 286.365, "r_y1": 522.929, "r_x2": 286.365, "r_y2": 514.377, "r_x3": 254.544, "r_y3": 514.377, "coord_origin": "TOPLEFT"}, "text": "metrics,", "orig": "metrics,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 63, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.037, "r_y0": 534.885, "r_x1": 286.365, "r_y1": 534.885, "r_x2": 286.365, "r_y2": 526.3330000000001, "r_x3": 70.037, "r_y3": 526.3330000000001, "coord_origin": "TOPLEFT"}, "text": "while being much more efficient in training and infer-", "orig": "while being much more efficient in training and infer-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 64, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.037, "r_y0": 546.84, "r_x1": 161.653, "r_y1": 546.84, "r_x2": 161.653, "r_y2": 538.288, "r_x3": 70.037, "r_y3": 538.288, "coord_origin": "TOPLEFT"}, "text": "ence to existing works.", "orig": "ence to existing works.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 65, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 61.569, "r_y0": 568.577, "r_x1": 65.056, "r_y1": 568.577, "r_x2": 65.056, "r_y2": 560.025, "r_x3": 61.569, "r_y3": 560.025, "coord_origin": "TOPLEFT"}, "text": "\u2022", "orig": "\u2022", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 66, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.037, "r_y0": 568.577, "r_x1": 116.712, "r_y1": 568.577, "r_x2": 116.712, "r_y2": 560.025, "r_x3": 70.037, "r_y3": 560.025, "coord_origin": "TOPLEFT"}, "text": "We present", "orig": "We present", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 67, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 121.583, "r_y0": 568.593, "r_x1": 177.682, "r_y1": 568.593, "r_x2": 177.682, "r_y2": 559.637, "r_x3": 121.583, "r_y3": 559.637, "coord_origin": "TOPLEFT"}, "text": "SynthTabNet", "orig": "SynthTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 68, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 182.553, "r_y0": 568.577, "r_x1": 186.976, "r_y1": 568.577, "r_x2": 186.976, "r_y2": 560.025, "r_x3": 182.553, "r_y3": 560.025, "coord_origin": "TOPLEFT"}, "text": "a", "orig": "a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 69, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 191.848, "r_y0": 568.577, "r_x1": 242.767, "r_y1": 568.577, "r_x2": 242.767, "r_y2": 560.025, "r_x3": 191.848, "r_y3": 560.025, "coord_origin": "TOPLEFT"}, "text": "synthetically", "orig": "synthetically", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 70, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 247.639, "r_y0": 568.577, "r_x1": 286.363, "r_y1": 568.577, "r_x2": 286.363, "r_y2": 560.025, "r_x3": 247.639, "r_y3": 560.025, "coord_origin": "TOPLEFT"}, "text": "generated", "orig": "generated", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 71, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.037, "r_y0": 580.532, "r_x1": 286.365, "r_y1": 580.532, "r_x2": 286.365, "r_y2": 571.98, "r_x3": 70.037, "r_y3": 571.98, "coord_origin": "TOPLEFT"}, "text": "dataset, with various appearance styles and complex-", "orig": "dataset, with various appearance styles and complex-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 72, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.037, "r_y0": 592.487, "r_x1": 82.401, "r_y1": 592.487, "r_x2": 82.401, "r_y2": 583.935, "r_x3": 70.037, "r_y3": 583.935, "coord_origin": "TOPLEFT"}, "text": "ity.", "orig": "ity.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 73, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 61.569, "r_y0": 614.2239999999999, "r_x1": 65.056, "r_y1": 614.2239999999999, "r_x2": 65.056, "r_y2": 605.672, "r_x3": 61.569, "r_y3": 605.672, "coord_origin": "TOPLEFT"}, "text": "\u2022", "orig": "\u2022", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 74, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.037, "r_y0": 614.2239999999999, "r_x1": 132.005, "r_y1": 614.2239999999999, "r_x2": 132.005, "r_y2": 605.672, "r_x3": 70.037, "r_y3": 605.672, "coord_origin": "TOPLEFT"}, "text": "An augmented", "orig": "An augmented", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 75, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 138.082, "r_y0": 614.2239999999999, "r_x1": 165.748, "r_y1": 614.2239999999999, "r_x2": 165.748, "r_y2": 605.672, "r_x3": 138.082, "r_y3": 605.672, "coord_origin": "TOPLEFT"}, "text": "dataset", "orig": "dataset", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 76, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 171.815, "r_y0": 614.2239999999999, "r_x1": 194.5, "r_y1": 614.2239999999999, "r_x2": 194.5, "r_y2": 605.672, "r_x3": 171.815, "r_y3": 605.672, "coord_origin": "TOPLEFT"}, "text": "based", "orig": "based", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 77, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 200.577, "r_y0": 614.2239999999999, "r_x1": 210.54, "r_y1": 614.2239999999999, "r_x2": 210.54, "r_y2": 605.672, "r_x3": 200.577, "r_y3": 605.672, "coord_origin": "TOPLEFT"}, "text": "on", "orig": "on", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 78, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 216.617, "r_y0": 614.2239999999999, "r_x1": 261.2, "r_y1": 614.2239999999999, "r_x2": 261.2, "r_y2": 605.672, "r_x3": 216.617, "r_y3": 605.672, "coord_origin": "TOPLEFT"}, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 79, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 267.277, "r_y0": 614.2239999999999, "r_x1": 286.365, "r_y1": 614.2239999999999, "r_x2": 286.365, "r_y2": 605.672, "r_x3": 267.277, "r_y3": 605.672, "coord_origin": "TOPLEFT"}, "text": "[37],", "orig": "[37],", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 80, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.037, "r_y0": 626.179, "r_x1": 135.521, "r_y1": 626.179, "r_x2": 135.521, "r_y2": 617.627, "r_x3": 70.037, "r_y3": 617.627, "coord_origin": "TOPLEFT"}, "text": "FinTabNet [36],", "orig": "FinTabNet [36],", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 81, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 139.925, "r_y0": 626.179, "r_x1": 286.365, "r_y1": 626.179, "r_x2": 286.365, "r_y2": 617.627, "r_x3": 139.925, "r_y3": 617.627, "coord_origin": "TOPLEFT"}, "text": "and TableBank [17] with generated", "orig": "and TableBank [17] with generated", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 82, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.037, "r_y0": 638.135, "r_x1": 198.056, "r_y1": 638.135, "r_x2": 198.056, "r_y2": 629.583, "r_x3": 70.037, "r_y3": 629.583, "coord_origin": "TOPLEFT"}, "text": "ground-truth for reproducibility.", "orig": "ground-truth for reproducibility.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 83, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 659.419, "r_x1": 204.452, "r_y1": 659.419, "r_x2": 204.452, "r_y2": 650.867, "r_x3": 62.067, "r_y3": 650.867, "coord_origin": "TOPLEFT"}, "text": "The paper is structured as follows.", "orig": "The paper is structured as follows.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 84, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 210.789, "r_y0": 659.419, "r_x1": 286.365, "r_y1": 659.419, "r_x2": 286.365, "r_y2": 650.867, "r_x3": 210.789, "r_y3": 650.867, "coord_origin": "TOPLEFT"}, "text": "In Sec. 2, we give", "orig": "In Sec. 2, we give", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 85, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 671.374, "r_x1": 240.896, "r_y1": 671.374, "r_x2": 240.896, "r_y2": 662.822, "r_x3": 50.112, "r_y3": 662.822, "coord_origin": "TOPLEFT"}, "text": "a brief overview of the current state-of-the-art.", "orig": "a brief overview of the current state-of-the-art.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 86, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 246.833, "r_y0": 671.374, "r_x1": 286.365, "r_y1": 671.374, "r_x2": 286.365, "r_y2": 662.822, "r_x3": 246.833, "r_y3": 662.822, "coord_origin": "TOPLEFT"}, "text": "In Sec. 3,", "orig": "In Sec. 3,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 87, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 683.329, "r_x1": 227.396, "r_y1": 683.329, "r_x2": 227.396, "r_y2": 674.777, "r_x3": 50.112, "r_y3": 674.777, "coord_origin": "TOPLEFT"}, "text": "we describe the datasets on which we train.", "orig": "we describe the datasets on which we train.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 88, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 232.467, "r_y0": 683.329, "r_x1": 286.365, "r_y1": 683.329, "r_x2": 286.365, "r_y2": 674.777, "r_x3": 232.467, "r_y3": 674.777, "coord_origin": "TOPLEFT"}, "text": "In Sec. 4, we", "orig": "In Sec. 4, we", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 89, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 695.284, "r_x1": 286.365, "r_y1": 695.284, "r_x2": 286.365, "r_y2": 686.732, "r_x3": 50.112, "r_y3": 686.732, "coord_origin": "TOPLEFT"}, "text": "introduce the TableFormer model-architecture and describe", "orig": "introduce the TableFormer model-architecture and describe", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 90, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 60.971, "r_y0": 709.427, "r_x1": 63.96, "r_y1": 709.427, "r_x2": 63.96, "r_y2": 704.296, "r_x3": 60.971, "r_y3": 704.296, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 91, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 64.458, "r_y0": 712.653, "r_x1": 183.731, "r_y1": 712.653, "r_x2": 183.731, "r_y2": 705.811, "r_x3": 64.458, "r_y3": 705.811, "coord_origin": "TOPLEFT"}, "text": "https://github.com/IBM/SynthTabNet", "orig": "https://github.com/IBM/SynthTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 92, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 84.029, "r_x1": 545.115, "r_y1": 84.029, "r_x2": 545.115, "r_y2": 75.47699999999998, "r_x3": 308.862, "r_y3": 75.47699999999998, "coord_origin": "TOPLEFT"}, "text": "its results &performance in Sec. 5. As a conclusion, we de-", "orig": "its results &performance in Sec. 5. As a conclusion, we de-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 93, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 95.98400000000004, "r_x1": 545.115, "r_y1": 95.98400000000004, "r_x2": 545.115, "r_y2": 87.43200000000002, "r_x3": 308.862, "r_y3": 87.43200000000002, "coord_origin": "TOPLEFT"}, "text": "scribe how this new model-architecture can be re-purposed", "orig": "scribe how this new model-architecture can be re-purposed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 94, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 107.93899999999996, "r_x1": 508.084, "r_y1": 107.93899999999996, "r_x2": 508.084, "r_y2": 99.38699999999994, "r_x3": 308.862, "r_y3": 99.38699999999994, "coord_origin": "TOPLEFT"}, "text": "for other tasks in the computer-vision community.", "orig": "for other tasks in the computer-vision community.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 95, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 132.48000000000002, "r_x1": 498.28, "r_y1": 132.48000000000002, "r_x2": 498.28, "r_y2": 121.73199999999997, "r_x3": 308.862, "r_y3": 121.73199999999997, "coord_origin": "TOPLEFT"}, "text": "2. Previous work and State of the Art", "orig": "2. Previous work and State of the Art", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 96, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 151.04200000000003, "r_x1": 545.115, "r_y1": 151.04200000000003, "r_x2": 545.115, "r_y2": 142.49, "r_x3": 320.817, "r_y3": 142.49, "coord_origin": "TOPLEFT"}, "text": "Identifying the structure of a table has been an outstand-", "orig": "Identifying the structure of a table has been an outstand-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 97, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 162.99699999999996, "r_x1": 545.115, "r_y1": 162.99699999999996, "r_x2": 545.115, "r_y2": 154.44500000000005, "r_x3": 308.862, "r_y3": 154.44500000000005, "coord_origin": "TOPLEFT"}, "text": "ing problem in the document-parsing community, that mo-", "orig": "ing problem in the document-parsing community, that mo-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 98, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 174.952, "r_x1": 334.376, "r_y1": 174.952, "r_x2": 334.376, "r_y2": 166.39999999999998, "r_x3": 308.862, "r_y3": 166.39999999999998, "coord_origin": "TOPLEFT"}, "text": "tivates", "orig": "tivates", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 99, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 338.192, "r_y0": 174.952, "r_x1": 522.56, "r_y1": 174.952, "r_x2": 522.56, "r_y2": 166.39999999999998, "r_x3": 338.192, "r_y3": 166.39999999999998, "coord_origin": "TOPLEFT"}, "text": "many organised public challenges [6, 4, 14].", "orig": "many organised public challenges [6, 4, 14].", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 100, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 529.623, "r_y0": 174.952, "r_x1": 545.115, "r_y1": 174.952, "r_x2": 545.115, "r_y2": 166.39999999999998, "r_x3": 529.623, "r_y3": 166.39999999999998, "coord_origin": "TOPLEFT"}, "text": "The", "orig": "The", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 101, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 186.90700000000004, "r_x1": 545.115, "r_y1": 186.90700000000004, "r_x2": 545.115, "r_y2": 178.35500000000002, "r_x3": 308.862, "r_y3": 178.35500000000002, "coord_origin": "TOPLEFT"}, "text": "difficulty of the problem can be attributed to a number of", "orig": "difficulty of the problem can be attributed to a number of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 102, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 198.86199999999997, "r_x1": 545.115, "r_y1": 198.86199999999997, "r_x2": 545.115, "r_y2": 190.30999999999995, "r_x3": 308.862, "r_y3": 190.30999999999995, "coord_origin": "TOPLEFT"}, "text": "factors. First, there is a large variety in the shapes and sizes", "orig": "factors. First, there is a large variety in the shapes and sizes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 103, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 210.817, "r_x1": 346.979, "r_y1": 210.817, "r_x2": 346.979, "r_y2": 202.265, "r_x3": 308.862, "r_y3": 202.265, "coord_origin": "TOPLEFT"}, "text": "of tables.", "orig": "of tables.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 104, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 354.869, "r_y0": 210.817, "r_x1": 508.642, "r_y1": 210.817, "r_x2": 508.642, "r_y2": 202.265, "r_x3": 354.869, "r_y3": 202.265, "coord_origin": "TOPLEFT"}, "text": "Such large variety requires a flexible", "orig": "Such large variety requires a flexible", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 105, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 512.737, "r_y0": 210.817, "r_x1": 545.115, "r_y1": 210.817, "r_x2": 545.115, "r_y2": 202.265, "r_x3": 512.737, "r_y3": 202.265, "coord_origin": "TOPLEFT"}, "text": "method.", "orig": "method.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 106, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 222.77300000000002, "r_x1": 545.115, "r_y1": 222.77300000000002, "r_x2": 545.115, "r_y2": 214.221, "r_x3": 308.862, "r_y3": 214.221, "coord_origin": "TOPLEFT"}, "text": "This is especially true for complex column- and row head-", "orig": "This is especially true for complex column- and row head-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 107, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 234.72799999999995, "r_x1": 322.969, "r_y1": 234.72799999999995, "r_x2": 322.969, "r_y2": 226.17600000000004, "r_x3": 308.862, "r_y3": 226.17600000000004, "coord_origin": "TOPLEFT"}, "text": "ers,", "orig": "ers,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 108, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 327.084, "r_y0": 234.72799999999995, "r_x1": 530.918, "r_y1": 234.72799999999995, "r_x2": 530.918, "r_y2": 226.17600000000004, "r_x3": 327.084, "r_y3": 226.17600000000004, "coord_origin": "TOPLEFT"}, "text": "which can be extremely intricate and demanding.", "orig": "which can be extremely intricate and demanding.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 109, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 537.922, "r_y0": 234.72799999999995, "r_x1": 545.115, "r_y1": 234.72799999999995, "r_x2": 545.115, "r_y2": 226.17600000000004, "r_x3": 537.922, "r_y3": 226.17600000000004, "coord_origin": "TOPLEFT"}, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 110, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 246.683, "r_x1": 545.115, "r_y1": 246.683, "r_x2": 545.115, "r_y2": 238.13099999999997, "r_x3": 308.862, "r_y3": 238.13099999999997, "coord_origin": "TOPLEFT"}, "text": "second factor of complexity is the lack of data with regard", "orig": "second factor of complexity is the lack of data with regard", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 111, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 258.63800000000003, "r_x1": 545.115, "r_y1": 258.63800000000003, "r_x2": 545.115, "r_y2": 250.086, "r_x3": 308.862, "r_y3": 250.086, "coord_origin": "TOPLEFT"}, "text": "to table-structure. Until the publication of PubTabNet [37],", "orig": "to table-structure. Until the publication of PubTabNet [37],", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 112, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 270.59299999999996, "r_x1": 439.84, "r_y1": 270.59299999999996, "r_x2": 439.84, "r_y2": 262.04100000000005, "r_x3": 308.862, "r_y3": 262.04100000000005, "coord_origin": "TOPLEFT"}, "text": "there were no large datasets (i.e.", "orig": "there were no large datasets (i.e.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 113, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 444.44, "r_y0": 270.429, "r_x1": 452.189, "r_y1": 270.429, "r_x2": 452.189, "r_y2": 261.72299999999996, "r_x3": 444.44, "r_y3": 261.72299999999996, "coord_origin": "TOPLEFT"}, "text": ">", "orig": ">", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 114, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 455.89, "r_y0": 270.429, "r_x1": 470.834, "r_y1": 270.429, "r_x2": 470.834, "r_y2": 261.72299999999996, "r_x3": 455.89, "r_y3": 261.72299999999996, "coord_origin": "TOPLEFT"}, "text": "100", "orig": "100", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 115, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 470.834, "r_y0": 270.59299999999996, "r_x1": 545.115, "r_y1": 270.59299999999996, "r_x2": 545.115, "r_y2": 262.04100000000005, "r_x3": 470.834, "r_y3": 262.04100000000005, "coord_origin": "TOPLEFT"}, "text": "K tables) that pro-", "orig": "K tables) that pro-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 116, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 282.548, "r_x1": 545.115, "r_y1": 282.548, "r_x2": 545.115, "r_y2": 273.996, "r_x3": 308.862, "r_y3": 273.996, "coord_origin": "TOPLEFT"}, "text": "vided structure information. This happens primarily due to", "orig": "vided structure information. This happens primarily due to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 117, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 294.504, "r_x1": 545.115, "r_y1": 294.504, "r_x2": 545.115, "r_y2": 285.952, "r_x3": 308.862, "r_y3": 285.952, "coord_origin": "TOPLEFT"}, "text": "the fact that tables are notoriously time-consuming to an-", "orig": "the fact that tables are notoriously time-consuming to an-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 118, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 306.459, "r_x1": 545.115, "r_y1": 306.459, "r_x2": 545.115, "r_y2": 297.907, "r_x3": 308.862, "r_y3": 297.907, "coord_origin": "TOPLEFT"}, "text": "notate by hand. However, this has definitely changed in re-", "orig": "notate by hand. However, this has definitely changed in re-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 119, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 318.414, "r_x1": 545.115, "r_y1": 318.414, "r_x2": 545.115, "r_y2": 309.862, "r_x3": 308.862, "r_y3": 309.862, "coord_origin": "TOPLEFT"}, "text": "cent years with the deliverance of PubTabNet [37], FinTab-", "orig": "cent years with the deliverance of PubTabNet [37], FinTab-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 120, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 330.369, "r_x1": 425.923, "r_y1": 330.369, "r_x2": 425.923, "r_y2": 321.817, "r_x3": 308.862, "r_y3": 321.817, "coord_origin": "TOPLEFT"}, "text": "Net [36], TableBank [17] etc.", "orig": "Net [36], TableBank [17] etc.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 121, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 342.39, "r_x1": 391.492, "r_y1": 342.39, "r_x2": 391.492, "r_y2": 333.838, "r_x3": 320.817, "r_y3": 333.838, "coord_origin": "TOPLEFT"}, "text": "Before the rising", "orig": "Before the rising", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 122, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 395.845, "r_y0": 342.39, "r_x1": 436.802, "r_y1": 342.39, "r_x2": 436.802, "r_y2": 333.838, "r_x3": 395.845, "r_y3": 333.838, "coord_origin": "TOPLEFT"}, "text": "popularity", "orig": "popularity", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 123, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 441.145, "r_y0": 342.39, "r_x1": 449.444, "r_y1": 342.39, "r_x2": 449.444, "r_y2": 333.838, "r_x3": 441.145, "r_y3": 333.838, "coord_origin": "TOPLEFT"}, "text": "of", "orig": "of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 124, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 453.798, "r_y0": 342.39, "r_x1": 545.115, "r_y1": 342.39, "r_x2": 545.115, "r_y2": 333.838, "r_x3": 453.798, "r_y3": 333.838, "coord_origin": "TOPLEFT"}, "text": "deep neural networks,", "orig": "deep neural networks,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 125, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 354.345, "r_x1": 545.115, "r_y1": 354.345, "r_x2": 545.115, "r_y2": 345.793, "r_x3": 308.862, "r_y3": 345.793, "coord_origin": "TOPLEFT"}, "text": "the community relied heavily on heuristic and/or statistical", "orig": "the community relied heavily on heuristic and/or statistical", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 126, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 366.3, "r_x1": 545.115, "r_y1": 366.3, "r_x2": 545.115, "r_y2": 357.748, "r_x3": 308.862, "r_y3": 357.748, "coord_origin": "TOPLEFT"}, "text": "methods to do table structure identification [3, 7, 11, 5, 13,", "orig": "methods to do table structure identification [3, 7, 11, 5, 13,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 127, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 378.256, "r_x1": 324.633, "r_y1": 378.256, "r_x2": 324.633, "r_y2": 369.704, "r_x3": 308.862, "r_y3": 369.704, "coord_origin": "TOPLEFT"}, "text": "28].", "orig": "28].", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 128, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 329.634, "r_y0": 378.256, "r_x1": 545.115, "r_y1": 378.256, "r_x2": 545.115, "r_y2": 369.704, "r_x3": 329.634, "r_y3": 369.704, "coord_origin": "TOPLEFT"}, "text": "Although such methods work well on constrained ta-", "orig": "Although such methods work well on constrained ta-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 129, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 390.211, "r_x1": 545.115, "r_y1": 390.211, "r_x2": 545.115, "r_y2": 381.659, "r_x3": 308.862, "r_y3": 381.659, "coord_origin": "TOPLEFT"}, "text": "bles [12], a more data-driven approach can be applied due", "orig": "bles [12], a more data-driven approach can be applied due", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 130, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 402.166, "r_x1": 545.115, "r_y1": 402.166, "r_x2": 545.115, "r_y2": 393.614, "r_x3": 308.862, "r_y3": 393.614, "coord_origin": "TOPLEFT"}, "text": "to the advent of convolutional neural networks (CNNs) and", "orig": "to the advent of convolutional neural networks (CNNs) and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 131, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 414.121, "r_x1": 438.416, "r_y1": 414.121, "r_x2": 438.416, "r_y2": 405.569, "r_x3": 308.862, "r_y3": 405.569, "coord_origin": "TOPLEFT"}, "text": "the availability of large datasets.", "orig": "the availability of large datasets.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 132, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 442.231, "r_y0": 414.121, "r_x1": 545.115, "r_y1": 414.121, "r_x2": 545.115, "r_y2": 405.569, "r_x3": 442.231, "r_y3": 405.569, "coord_origin": "TOPLEFT"}, "text": "To the best-of-our knowl-", "orig": "To the best-of-our knowl-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 133, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 426.076, "r_x1": 545.115, "r_y1": 426.076, "r_x2": 545.115, "r_y2": 417.524, "r_x3": 308.862, "r_y3": 417.524, "coord_origin": "TOPLEFT"}, "text": "edge, there are currently two different types of network ar-", "orig": "edge, there are currently two different types of network ar-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 134, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 438.032, "r_x1": 545.115, "r_y1": 438.032, "r_x2": 545.115, "r_y2": 429.48, "r_x3": 308.862, "r_y3": 429.48, "coord_origin": "TOPLEFT"}, "text": "chitecture that are being pursued for state-of-the-art table-", "orig": "chitecture that are being pursued for state-of-the-art table-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 135, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 449.987, "r_x1": 401.285, "r_y1": 449.987, "r_x2": 401.285, "r_y2": 441.435, "r_x3": 308.862, "r_y3": 441.435, "coord_origin": "TOPLEFT"}, "text": "structure identification.", "orig": "structure identification.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 136, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 462.024, "r_x1": 423.262, "r_y1": 462.024, "r_x2": 423.262, "r_y2": 453.068, "r_x3": 320.817, "r_y3": 453.068, "coord_origin": "TOPLEFT"}, "text": "Image-to-Text networks", "orig": "Image-to-Text networks", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 137, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 423.267, "r_y0": 462.008, "r_x1": 426.037, "r_y1": 462.008, "r_x2": 426.037, "r_y2": 453.456, "r_x3": 423.267, "r_y3": 453.456, "coord_origin": "TOPLEFT"}, "text": ":", "orig": ":", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 138, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 430.769, "r_y0": 462.008, "r_x1": 545.11, "r_y1": 462.008, "r_x2": 545.11, "r_y2": 453.456, "r_x3": 430.769, "r_y3": 453.456, "coord_origin": "TOPLEFT"}, "text": "In this type of network, one", "orig": "In this type of network, one", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 139, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 473.963, "r_x1": 340.404, "r_y1": 473.963, "r_x2": 340.404, "r_y2": 465.411, "r_x3": 308.862, "r_y3": 465.411, "coord_origin": "TOPLEFT"}, "text": "predicts", "orig": "predicts", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 140, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 345.116, "r_y0": 473.963, "r_x1": 349.539, "r_y1": 473.963, "r_x2": 349.539, "r_y2": 465.411, "r_x3": 345.116, "r_y3": 465.411, "coord_origin": "TOPLEFT"}, "text": "a", "orig": "a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 141, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 354.252, "r_y0": 473.963, "r_x1": 390.765, "r_y1": 473.963, "r_x2": 390.765, "r_y2": 465.411, "r_x3": 354.252, "r_y3": 465.411, "coord_origin": "TOPLEFT"}, "text": "sequence", "orig": "sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 142, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 395.477, "r_y0": 473.963, "r_x1": 403.776, "r_y1": 473.963, "r_x2": 403.776, "r_y2": 465.411, "r_x3": 395.477, "r_y3": 465.411, "coord_origin": "TOPLEFT"}, "text": "of", "orig": "of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 143, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 408.488, "r_y0": 473.963, "r_x1": 434.401, "r_y1": 473.963, "r_x2": 434.401, "r_y2": 465.411, "r_x3": 408.488, "r_y3": 465.411, "coord_origin": "TOPLEFT"}, "text": "tokens", "orig": "tokens", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 144, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 439.113, "r_y0": 473.963, "r_x1": 469.001, "r_y1": 473.963, "r_x2": 469.001, "r_y2": 465.411, "r_x3": 439.113, "r_y3": 465.411, "coord_origin": "TOPLEFT"}, "text": "starting", "orig": "starting", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 145, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 473.713, "r_y0": 473.963, "r_x1": 545.115, "r_y1": 473.963, "r_x2": 545.115, "r_y2": 465.411, "r_x3": 473.713, "r_y3": 465.411, "coord_origin": "TOPLEFT"}, "text": "from an encoded", "orig": "from an encoded", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 146, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 485.918, "r_x1": 335.701, "r_y1": 485.918, "r_x2": 335.701, "r_y2": 477.366, "r_x3": 308.862, "r_y3": 477.366, "coord_origin": "TOPLEFT"}, "text": "image.", "orig": "image.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 147, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 345.853, "r_y0": 485.918, "r_x1": 411.009, "r_y1": 485.918, "r_x2": 411.009, "r_y2": 477.366, "r_x3": 345.853, "r_y3": 477.366, "coord_origin": "TOPLEFT"}, "text": "Such sequences", "orig": "Such sequences", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 148, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 415.85, "r_y0": 485.918, "r_x1": 424.149, "r_y1": 485.918, "r_x2": 424.149, "r_y2": 477.366, "r_x3": 415.85, "r_y3": 477.366, "coord_origin": "TOPLEFT"}, "text": "of", "orig": "of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 149, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 429.001, "r_y0": 485.918, "r_x1": 454.914, "r_y1": 485.918, "r_x2": 454.914, "r_y2": 477.366, "r_x3": 429.001, "r_y3": 477.366, "coord_origin": "TOPLEFT"}, "text": "tokens", "orig": "tokens", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 150, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 459.756, "r_y0": 485.918, "r_x1": 473.584, "r_y1": 485.918, "r_x2": 473.584, "r_y2": 477.366, "r_x3": 459.756, "r_y3": 477.366, "coord_origin": "TOPLEFT"}, "text": "can", "orig": "can", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 151, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 478.425, "r_y0": 485.918, "r_x1": 487.83, "r_y1": 485.918, "r_x2": 487.83, "r_y2": 477.366, "r_x3": 478.425, "r_y3": 477.366, "coord_origin": "TOPLEFT"}, "text": "be", "orig": "be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 152, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 492.682, "r_y0": 485.918, "r_x1": 545.115, "r_y1": 485.918, "r_x2": 545.115, "r_y2": 477.366, "r_x3": 492.682, "r_y3": 477.366, "coord_origin": "TOPLEFT"}, "text": "HTML table", "orig": "HTML table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 153, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 497.873, "r_x1": 459.218, "r_y1": 497.873, "r_x2": 459.218, "r_y2": 489.321, "r_x3": 308.862, "r_y3": 489.321, "coord_origin": "TOPLEFT"}, "text": "tags [37, 17] or LaTeX symbols[10].", "orig": "tags [37, 17] or LaTeX symbols[10].", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 154, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 465.115, "r_y0": 497.873, "r_x1": 545.115, "r_y1": 497.873, "r_x2": 545.115, "r_y2": 489.321, "r_x3": 465.115, "r_y3": 489.321, "coord_origin": "TOPLEFT"}, "text": "The choice of sym-", "orig": "The choice of sym-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 155, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 509.828, "r_x1": 545.115, "r_y1": 509.828, "r_x2": 545.115, "r_y2": 501.276, "r_x3": 308.862, "r_y3": 501.276, "coord_origin": "TOPLEFT"}, "text": "bols is ultimately not very important, since one can be trans-", "orig": "bols is ultimately not very important, since one can be trans-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 156, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 521.784, "r_x1": 396.692, "r_y1": 521.784, "r_x2": 396.692, "r_y2": 513.232, "r_x3": 308.862, "r_y3": 513.232, "coord_origin": "TOPLEFT"}, "text": "formed into the other.", "orig": "formed into the other.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 157, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 401.265, "r_y0": 521.784, "r_x1": 545.115, "r_y1": 521.784, "r_x2": 545.115, "r_y2": 513.232, "r_x3": 401.265, "r_y3": 513.232, "coord_origin": "TOPLEFT"}, "text": "There are however subtle variations", "orig": "There are however subtle variations", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 158, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 533.739, "r_x1": 433.484, "r_y1": 533.739, "r_x2": 433.484, "r_y2": 525.187, "r_x3": 308.862, "r_y3": 525.187, "coord_origin": "TOPLEFT"}, "text": "in the Image-to-Text networks.", "orig": "in the Image-to-Text networks.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 159, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 438.187, "r_y0": 533.739, "r_x1": 545.115, "r_y1": 533.739, "r_x2": 545.115, "r_y2": 525.187, "r_x3": 438.187, "r_y3": 525.187, "coord_origin": "TOPLEFT"}, "text": "The easiest network archi-", "orig": "The easiest network archi-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 160, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 545.694, "r_x1": 420.941, "r_y1": 545.694, "r_x2": 420.941, "r_y2": 537.142, "r_x3": 308.862, "r_y3": 537.142, "coord_origin": "TOPLEFT"}, "text": "tectures are 'image-encoder", "orig": "tectures are 'image-encoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 161, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 423.595, "r_y0": 545.388, "r_x1": 433.558, "r_y1": 545.388, "r_x2": 433.558, "r_y2": 536.8240000000001, "r_x3": 423.595, "r_y3": 536.8240000000001, "coord_origin": "TOPLEFT"}, "text": "\u2192", "orig": "\u2192", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 162, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 436.212, "r_y0": 545.694, "r_x1": 545.113, "r_y1": 545.694, "r_x2": 545.113, "r_y2": 537.142, "r_x3": 436.212, "r_y3": 537.142, "coord_origin": "TOPLEFT"}, "text": "text-decoder' (IETD), sim-", "orig": "text-decoder' (IETD), sim-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 163, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 557.649, "r_x1": 545.115, "r_y1": 557.649, "r_x2": 545.115, "r_y2": 549.097, "r_x3": 308.862, "r_y3": 549.097, "coord_origin": "TOPLEFT"}, "text": "ilar to network architectures that try to provide captions to", "orig": "ilar to network architectures that try to provide captions to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 164, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 569.604, "r_x1": 545.115, "r_y1": 569.604, "r_x2": 545.115, "r_y2": 561.052, "r_x3": 308.862, "r_y3": 561.052, "coord_origin": "TOPLEFT"}, "text": "images [32]. In these IETD networks, one expects as output", "orig": "images [32]. In these IETD networks, one expects as output", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 165, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 581.559, "r_x1": 503.671, "r_y1": 581.559, "r_x2": 503.671, "r_y2": 573.0070000000001, "r_x3": 308.862, "r_y3": 573.0070000000001, "coord_origin": "TOPLEFT"}, "text": "the LaTeX/HTML string of the entire table, i.e.", "orig": "the LaTeX/HTML string of the entire table, i.e.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 166, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 509.579, "r_y0": 581.559, "r_x1": 545.115, "r_y1": 581.559, "r_x2": 545.115, "r_y2": 573.0070000000001, "r_x3": 509.579, "r_y3": 573.0070000000001, "coord_origin": "TOPLEFT"}, "text": "the sym-", "orig": "the sym-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 167, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 593.515, "r_x1": 545.115, "r_y1": 593.515, "r_x2": 545.115, "r_y2": 584.963, "r_x3": 308.862, "r_y3": 584.963, "coord_origin": "TOPLEFT"}, "text": "bols necessary for creating the table with the content of the", "orig": "bols necessary for creating the table with the content of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 168, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 605.47, "r_x1": 330.72, "r_y1": 605.47, "r_x2": 330.72, "r_y2": 596.918, "r_x3": 308.862, "r_y3": 596.918, "coord_origin": "TOPLEFT"}, "text": "table.", "orig": "table.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 169, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 334.536, "r_y0": 605.47, "r_x1": 497.075, "r_y1": 605.47, "r_x2": 497.075, "r_y2": 596.918, "r_x3": 334.536, "r_y3": 596.918, "coord_origin": "TOPLEFT"}, "text": "Another approach is the 'image-encoder", "orig": "Another approach is the 'image-encoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 170, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 499.805, "r_y0": 605.164, "r_x1": 509.768, "r_y1": 605.164, "r_x2": 509.768, "r_y2": 596.6, "r_x3": 499.805, "r_y3": 596.6, "coord_origin": "TOPLEFT"}, "text": "\u2192", "orig": "\u2192", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 171, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 512.501, "r_y0": 605.47, "r_x1": 545.109, "r_y1": 605.47, "r_x2": 545.109, "r_y2": 596.918, "r_x3": 512.501, "r_y3": 596.918, "coord_origin": "TOPLEFT"}, "text": "dual de-", "orig": "dual de-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 172, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 617.425, "r_x1": 545.115, "r_y1": 617.425, "r_x2": 545.115, "r_y2": 608.873, "r_x3": 308.862, "r_y3": 608.873, "coord_origin": "TOPLEFT"}, "text": "coder' (IEDD) networks. In these type of networks, one has", "orig": "coder' (IEDD) networks. In these type of networks, one has", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 173, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 629.38, "r_x1": 545.115, "r_y1": 629.38, "r_x2": 545.115, "r_y2": 620.828, "r_x3": 308.862, "r_y3": 620.828, "coord_origin": "TOPLEFT"}, "text": "two consecutive decoders with different purposes. The first", "orig": "two consecutive decoders with different purposes. The first", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 174, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 641.335, "r_x1": 364.782, "r_y1": 641.335, "r_x2": 364.782, "r_y2": 632.783, "r_x3": 308.862, "r_y3": 632.783, "coord_origin": "TOPLEFT"}, "text": "decoder is the", "orig": "decoder is the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 175, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 367.574, "r_y0": 641.192, "r_x1": 415.614, "r_y1": 641.192, "r_x2": 415.614, "r_y2": 632.604, "r_x3": 367.574, "r_y3": 632.604, "coord_origin": "TOPLEFT"}, "text": "tag-decoder", "orig": "tag-decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 176, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 415.613, "r_y0": 641.335, "r_x1": 418.104, "r_y1": 641.335, "r_x2": 418.104, "r_y2": 632.783, "r_x3": 415.613, "r_y3": 632.783, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 177, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 420.963, "r_y0": 641.335, "r_x1": 433.137, "r_y1": 641.335, "r_x2": 433.137, "r_y2": 632.783, "r_x3": 420.963, "r_y3": 632.783, "coord_origin": "TOPLEFT"}, "text": "i.e.", "orig": "i.e.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 178, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 437.122, "r_y0": 641.335, "r_x1": 442.661, "r_y1": 641.335, "r_x2": 442.661, "r_y2": 632.783, "r_x3": 437.122, "r_y3": 632.783, "coord_origin": "TOPLEFT"}, "text": "it", "orig": "it", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 179, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 445.441, "r_y0": 641.335, "r_x1": 545.117, "r_y1": 641.335, "r_x2": 545.117, "r_y2": 632.783, "r_x3": 445.441, "r_y3": 632.783, "coord_origin": "TOPLEFT"}, "text": "only produces the HTM-", "orig": "only produces the HTM-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 180, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 653.29, "r_x1": 545.115, "r_y1": 653.29, "r_x2": 545.115, "r_y2": 644.738, "r_x3": 308.862, "r_y3": 644.738, "coord_origin": "TOPLEFT"}, "text": "L/LaTeX tags which construct an empty table. The second", "orig": "L/LaTeX tags which construct an empty table. The second", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 181, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 665.103, "r_x1": 373.599, "r_y1": 665.103, "r_x2": 373.599, "r_y2": 656.515, "r_x3": 308.862, "r_y3": 656.515, "coord_origin": "TOPLEFT"}, "text": "content-decoder", "orig": "content-decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 182, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 376.907, "r_y0": 665.246, "r_x1": 545.116, "r_y1": 665.246, "r_x2": 545.116, "r_y2": 656.694, "r_x3": 376.907, "r_y3": 656.694, "coord_origin": "TOPLEFT"}, "text": "uses the encoding of the image in combi-", "orig": "uses the encoding of the image in combi-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 183, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 677.201, "r_x1": 545.115, "r_y1": 677.201, "r_x2": 545.115, "r_y2": 668.649, "r_x3": 308.862, "r_y3": 668.649, "coord_origin": "TOPLEFT"}, "text": "nation with the output encoding of each cell-tag (from the", "orig": "nation with the output encoding of each cell-tag (from the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 184, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 689.013, "r_x1": 356.902, "r_y1": 689.013, "r_x2": 356.902, "r_y2": 680.425, "r_x3": 308.862, "r_y3": 680.425, "coord_origin": "TOPLEFT"}, "text": "tag-decoder", "orig": "tag-decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 185, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 357.131, "r_y0": 689.156, "r_x1": 360.449, "r_y1": 689.156, "r_x2": 360.449, "r_y2": 680.604, "r_x3": 357.131, "r_y3": 680.604, "coord_origin": "TOPLEFT"}, "text": ")", "orig": ")", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 186, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 364.045, "r_y0": 689.156, "r_x1": 545.115, "r_y1": 689.156, "r_x2": 545.115, "r_y2": 680.604, "r_x3": 364.045, "r_y3": 680.604, "coord_origin": "TOPLEFT"}, "text": "to generate the textual content of each table", "orig": "to generate the textual content of each table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 187, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 701.111, "r_x1": 325.739, "r_y1": 701.111, "r_x2": 325.739, "r_y2": 692.559, "r_x3": 308.862, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "cell.", "orig": "cell.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 188, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 331.746, "r_y0": 701.111, "r_x1": 545.115, "r_y1": 701.111, "r_x2": 545.115, "r_y2": 692.559, "r_x3": 331.746, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "The network architecture of IEDD is certainly more", "orig": "The network architecture of IEDD is certainly more", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 189, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 713.066, "r_x1": 545.115, "r_y1": 713.066, "r_x2": 545.115, "r_y2": 704.514, "r_x3": 308.862, "r_y3": 704.514, "coord_origin": "TOPLEFT"}, "text": "elaborate, but it has the advantage that one can pre-train the", "orig": "elaborate, but it has the advantage that one can pre-train the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 190, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 295.121, "r_y0": 742.954, "r_x1": 300.102, "r_y1": 742.954, "r_x2": 300.102, "r_y2": 734.402, "r_x3": 295.121, "r_y3": 734.402, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "parsed_page": null, "predictions": {"layout": {"clusters": [{"id": 12, "label": "text", "bbox": {"l": 50.112, "t": 75.47699999999998, "r": 286.365, "b": 95.98400000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.9656890034675598, "cells": [{"index": 0, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 84.029, "r_x1": 286.365, "r_y1": 84.029, "r_x2": 286.365, "r_y2": 75.47699999999998, "r_x3": 50.112, "r_y3": 75.47699999999998, "coord_origin": "TOPLEFT"}, "text": "considered as a solved problem, given enough ground-truth", "orig": "considered as a solved problem, given enough ground-truth", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 95.98400000000004, "r_x1": 112.647, "r_y1": 95.98400000000004, "r_x2": 112.647, "r_y2": 87.43200000000002, "r_x3": 50.112, "r_y3": 87.43200000000002, "coord_origin": "TOPLEFT"}, "text": "data to train on.", "orig": "data to train on.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 4, "label": "text", "bbox": {"l": 50.112, "t": 99.84000000000003, "r": 286.365, "b": 227.94399999999996, "coord_origin": "TOPLEFT"}, "confidence": 0.9838606119155884, "cells": [{"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 108.39200000000005, "r_x1": 286.365, "r_y1": 108.39200000000005, "r_x2": 286.365, "r_y2": 99.84000000000003, "r_x3": 62.067, "r_y3": 99.84000000000003, "coord_origin": "TOPLEFT"}, "text": "The second problem is called table-structure decompo-", "orig": "The second problem is called table-structure decompo-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 120.34699999999998, "r_x1": 74.75, "r_y1": 120.34699999999998, "r_x2": 74.75, "r_y2": 111.79499999999996, "r_x3": 50.112, "r_y3": 111.79499999999996, "coord_origin": "TOPLEFT"}, "text": "sition.", "orig": "sition.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 81.335, "r_y0": 120.34699999999998, "r_x1": 286.365, "r_y1": 120.34699999999998, "r_x2": 286.365, "r_y2": 111.79499999999996, "r_x3": 81.335, "r_y3": 111.79499999999996, "coord_origin": "TOPLEFT"}, "text": "The latter is a long standing problem in the com-", "orig": "The latter is a long standing problem in the com-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 132.30200000000002, "r_x1": 235.117, "r_y1": 132.30200000000002, "r_x2": 235.117, "r_y2": 123.75, "r_x3": 50.112, "r_y3": 123.75, "coord_origin": "TOPLEFT"}, "text": "munity of document understanding [6, 4, 14].", "orig": "munity of document understanding [6, 4, 14].", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 240.079, "r_y0": 132.30200000000002, "r_x1": 286.365, "r_y1": 132.30200000000002, "r_x2": 286.365, "r_y2": 123.75, "r_x3": 240.079, "r_y3": 123.75, "coord_origin": "TOPLEFT"}, "text": "Contrary to", "orig": "Contrary to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 144.25699999999995, "r_x1": 286.365, "r_y1": 144.25699999999995, "r_x2": 286.365, "r_y2": 135.70500000000004, "r_x3": 50.112, "r_y3": 135.70500000000004, "coord_origin": "TOPLEFT"}, "text": "the table-location problem, there are no commonly used ap-", "orig": "the table-location problem, there are no commonly used ap-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 156.21299999999997, "r_x1": 286.365, "r_y1": 156.21299999999997, "r_x2": 286.365, "r_y2": 147.66099999999994, "r_x3": 50.112, "r_y3": 147.66099999999994, "coord_origin": "TOPLEFT"}, "text": "proaches that can easily be re-purposed to solve this prob-", "orig": "proaches that can easily be re-purposed to solve this prob-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 168.168, "r_x1": 286.365, "r_y1": 168.168, "r_x2": 286.365, "r_y2": 159.61599999999999, "r_x3": 50.112, "r_y3": 159.61599999999999, "coord_origin": "TOPLEFT"}, "text": "lem. Lately, a set of new model-architectures has been pro-", "orig": "lem. Lately, a set of new model-architectures has been pro-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 180.12300000000005, "r_x1": 286.365, "r_y1": 180.12300000000005, "r_x2": 286.365, "r_y2": 171.57100000000003, "r_x3": 50.112, "r_y3": 171.57100000000003, "coord_origin": "TOPLEFT"}, "text": "posed by the community to address table-structure decom-", "orig": "posed by the community to address table-structure decom-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 192.07799999999997, "r_x1": 286.365, "r_y1": 192.07799999999997, "r_x2": 286.365, "r_y2": 183.52599999999995, "r_x3": 50.112, "r_y3": 183.52599999999995, "coord_origin": "TOPLEFT"}, "text": "position [37, 36, 18, 20]. All these models have some weak-", "orig": "position [37, 36, 18, 20]. All these models have some weak-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 204.03300000000002, "r_x1": 114.51, "r_y1": 204.03300000000002, "r_x2": 114.51, "r_y2": 195.481, "r_x3": 50.112, "r_y3": 195.481, "coord_origin": "TOPLEFT"}, "text": "nesses (see Sec.", "orig": "nesses (see Sec.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 119.163, "r_y0": 204.03300000000002, "r_x1": 129.952, "r_y1": 204.03300000000002, "r_x2": 129.952, "r_y2": 195.481, "r_x3": 119.163, "r_y3": 195.481, "coord_origin": "TOPLEFT"}, "text": "2).", "orig": "2).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.615, "r_y0": 204.03300000000002, "r_x1": 286.365, "r_y1": 204.03300000000002, "r_x2": 286.365, "r_y2": 195.481, "r_x3": 134.615, "r_y3": 195.481, "coord_origin": "TOPLEFT"}, "text": "The common denominator here is the", "orig": "The common denominator here is the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 215.98800000000006, "r_x1": 286.365, "r_y1": 215.98800000000006, "r_x2": 286.365, "r_y2": 207.43600000000004, "r_x3": 50.112, "r_y3": 207.43600000000004, "coord_origin": "TOPLEFT"}, "text": "reliance on textual features and/or the inability to provide", "orig": "reliance on textual features and/or the inability to provide", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 227.94399999999996, "r_x1": 278.664, "r_y1": 227.94399999999996, "r_x2": 278.664, "r_y2": 219.39200000000005, "r_x3": 50.112, "r_y3": 219.39200000000005, "coord_origin": "TOPLEFT"}, "text": "the bounding box of each table-cell in the original image.", "orig": "the bounding box of each table-cell in the original image.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 2, "label": "text", "bbox": {"l": 50.112, "t": 231.79999999999995, "r": 286.365, "b": 371.859, "coord_origin": "TOPLEFT"}, "confidence": 0.9855920076370239, "cells": [{"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 240.35199999999998, "r_x1": 286.365, "r_y1": 240.35199999999998, "r_x2": 286.365, "r_y2": 231.79999999999995, "r_x3": 62.067, "r_y3": 231.79999999999995, "coord_origin": "TOPLEFT"}, "text": "In this paper, we want to address these weaknesses and", "orig": "In this paper, we want to address these weaknesses and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 252.30700000000002, "r_x1": 78.884, "r_y1": 252.30700000000002, "r_x2": 78.884, "r_y2": 243.755, "r_x3": 50.112, "r_y3": 243.755, "coord_origin": "TOPLEFT"}, "text": "present", "orig": "present", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 19, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 83.068, "r_y0": 252.30700000000002, "r_x1": 116.373, "r_y1": 252.30700000000002, "r_x2": 116.373, "r_y2": 243.755, "r_x3": 83.068, "r_y3": 243.755, "coord_origin": "TOPLEFT"}, "text": "a robust", "orig": "a robust", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 20, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 120.558, "r_y0": 252.30700000000002, "r_x1": 178.102, "r_y1": 252.30700000000002, "r_x2": 178.102, "r_y2": 243.755, "r_x3": 120.558, "r_y3": 243.755, "coord_origin": "TOPLEFT"}, "text": "table-structure", "orig": "table-structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 21, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 182.276, "r_y0": 252.30700000000002, "r_x1": 286.365, "r_y1": 252.30700000000002, "r_x2": 286.365, "r_y2": 243.755, "r_x3": 182.276, "r_y3": 243.755, "coord_origin": "TOPLEFT"}, "text": "decomposition algorithm.", "orig": "decomposition algorithm.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 22, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 264.26199999999994, "r_x1": 260.432, "r_y1": 264.26199999999994, "r_x2": 260.432, "r_y2": 255.71000000000004, "r_x3": 50.112, "r_y3": 255.71000000000004, "coord_origin": "TOPLEFT"}, "text": "The design criteria for our model are the following.", "orig": "The design criteria for our model are the following.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 23, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 265.603, "r_y0": 264.26199999999994, "r_x1": 286.365, "r_y1": 264.26199999999994, "r_x2": 286.365, "r_y2": 255.71000000000004, "r_x3": 265.603, "r_y3": 255.71000000000004, "coord_origin": "TOPLEFT"}, "text": "First,", "orig": "First,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 24, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 276.217, "r_x1": 286.365, "r_y1": 276.217, "r_x2": 286.365, "r_y2": 267.66499999999996, "r_x3": 50.112, "r_y3": 267.66499999999996, "coord_origin": "TOPLEFT"}, "text": "we want our algorithm to be language agnostic. In this way,", "orig": "we want our algorithm to be language agnostic. In this way,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 25, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 288.172, "r_x1": 286.365, "r_y1": 288.172, "r_x2": 286.365, "r_y2": 279.62, "r_x3": 50.112, "r_y3": 279.62, "coord_origin": "TOPLEFT"}, "text": "we can obtain the structure of any table, irregardless of the", "orig": "we can obtain the structure of any table, irregardless of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 26, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 300.128, "r_x1": 88.568, "r_y1": 300.128, "r_x2": 88.568, "r_y2": 291.576, "r_x3": 50.112, "r_y3": 291.576, "coord_origin": "TOPLEFT"}, "text": "language.", "orig": "language.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 27, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 95.502, "r_y0": 300.128, "r_x1": 286.365, "r_y1": 300.128, "r_x2": 286.365, "r_y2": 291.576, "r_x3": 95.502, "r_y3": 291.576, "coord_origin": "TOPLEFT"}, "text": "Second, we want our algorithm to leverage as", "orig": "Second, we want our algorithm to leverage as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 28, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 312.083, "r_x1": 286.365, "r_y1": 312.083, "r_x2": 286.365, "r_y2": 303.531, "r_x3": 50.112, "r_y3": 303.531, "coord_origin": "TOPLEFT"}, "text": "much data as possible from the original PDF document. For", "orig": "much data as possible from the original PDF document. For", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 29, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 324.038, "r_x1": 286.365, "r_y1": 324.038, "r_x2": 286.365, "r_y2": 315.486, "r_x3": 50.112, "r_y3": 315.486, "coord_origin": "TOPLEFT"}, "text": "programmatic PDF documents, the text-cells can often be", "orig": "programmatic PDF documents, the text-cells can often be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 30, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 335.993, "r_x1": 286.365, "r_y1": 335.993, "r_x2": 286.365, "r_y2": 327.441, "r_x3": 50.112, "r_y3": 327.441, "coord_origin": "TOPLEFT"}, "text": "extracted much faster and with higher accuracy compared", "orig": "extracted much faster and with higher accuracy compared", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 347.948, "r_x1": 286.365, "r_y1": 347.948, "r_x2": 286.365, "r_y2": 339.396, "r_x3": 50.112, "r_y3": 339.396, "coord_origin": "TOPLEFT"}, "text": "to OCR methods. Last but not least, we want to have a di-", "orig": "to OCR methods. Last but not least, we want to have a di-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 359.904, "r_x1": 286.365, "r_y1": 359.904, "r_x2": 286.365, "r_y2": 351.352, "r_x3": 50.112, "r_y3": 351.352, "coord_origin": "TOPLEFT"}, "text": "rect link between the table-cell and its bounding box in the", "orig": "rect link between the table-cell and its bounding box in the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 371.859, "r_x1": 76.951, "r_y1": 371.859, "r_x2": 76.951, "r_y2": 363.307, "r_x3": 50.112, "r_y3": 363.307, "coord_origin": "TOPLEFT"}, "text": "image.", "orig": "image.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 7, "label": "text", "bbox": {"l": 50.112, "t": 375.715, "r": 286.367, "b": 432.087, "coord_origin": "TOPLEFT"}, "confidence": 0.9820111393928528, "cells": [{"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 384.267, "r_x1": 286.365, "r_y1": 384.267, "r_x2": 286.365, "r_y2": 375.715, "r_x3": 62.067, "r_y3": 375.715, "coord_origin": "TOPLEFT"}, "text": "To meet the design criteria listed above, we developed a", "orig": "To meet the design criteria listed above, we developed a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 396.222, "r_x1": 120.986, "r_y1": 396.222, "r_x2": 120.986, "r_y2": 387.67, "r_x3": 50.112, "r_y3": 387.67, "coord_origin": "TOPLEFT"}, "text": "new model called", "orig": "new model called", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 123.901, "r_y0": 396.238, "r_x1": 179.731, "r_y1": 396.238, "r_x2": 179.731, "r_y2": 387.282, "r_x3": 123.901, "r_y3": 387.282, "coord_origin": "TOPLEFT"}, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 182.646, "r_y0": 396.222, "r_x1": 286.367, "r_y1": 396.222, "r_x2": 286.367, "r_y2": 387.67, "r_x3": 182.646, "r_y3": 387.67, "coord_origin": "TOPLEFT"}, "text": "and a synthetically gener-", "orig": "and a synthetically gener-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 408.177, "r_x1": 181.758, "r_y1": 408.177, "r_x2": 181.758, "r_y2": 399.625, "r_x3": 50.112, "r_y3": 399.625, "coord_origin": "TOPLEFT"}, "text": "ated table structure dataset called", "orig": "ated table structure dataset called", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 184.104, "r_y0": 408.193, "r_x1": 240.203, "r_y1": 408.193, "r_x2": 240.203, "r_y2": 399.237, "r_x3": 184.104, "r_y3": 399.237, "coord_origin": "TOPLEFT"}, "text": "SynthTabNet", "orig": "SynthTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 240.204, "r_y0": 403.942, "r_x1": 243.691, "r_y1": 403.942, "r_x2": 243.691, "r_y2": 397.956, "r_x3": 240.204, "r_y3": 397.956, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 244.189, "r_y0": 408.177, "r_x1": 246.68, "r_y1": 408.177, "r_x2": 246.68, "r_y2": 399.625, "r_x3": 244.189, "r_y3": 399.625, "coord_origin": "TOPLEFT"}, "text": ".", "orig": ".", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 249.718, "r_y0": 408.177, "r_x1": 286.361, "r_y1": 408.177, "r_x2": 286.361, "r_y2": 399.625, "r_x3": 249.718, "r_y3": 399.625, "coord_origin": "TOPLEFT"}, "text": "In partic-", "orig": "In partic-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 420.132, "r_x1": 67.696, "r_y1": 420.132, "r_x2": 67.696, "r_y2": 411.58, "r_x3": 50.112, "r_y3": 411.58, "coord_origin": "TOPLEFT"}, "text": "ular,", "orig": "ular,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 71.322, "r_y0": 420.132, "r_x1": 286.365, "r_y1": 420.132, "r_x2": 286.365, "r_y2": 411.58, "r_x3": 71.322, "r_y3": 411.58, "coord_origin": "TOPLEFT"}, "text": "our contributions in this work can be summarised as", "orig": "our contributions in this work can be summarised as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 432.087, "r_x1": 82.52, "r_y1": 432.087, "r_x2": 82.52, "r_y2": 423.535, "r_x3": 50.112, "r_y3": 423.535, "coord_origin": "TOPLEFT"}, "text": "follows:", "orig": "follows:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 6, "label": "list_item", "bbox": {"l": 61.569, "t": 444.432, "r": 286.365, "b": 489.237, "coord_origin": "TOPLEFT"}, "confidence": 0.9822162389755249, "cells": [{"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 61.569, "r_y0": 453.372, "r_x1": 65.056, "r_y1": 453.372, "r_x2": 65.056, "r_y2": 444.82, "r_x3": 61.569, "r_y3": 444.82, "coord_origin": "TOPLEFT"}, "text": "\u2022", "orig": "\u2022", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.037, "r_y0": 453.372, "r_x1": 117.101, "r_y1": 453.372, "r_x2": 117.101, "r_y2": 444.82, "r_x3": 70.037, "r_y3": 444.82, "coord_origin": "TOPLEFT"}, "text": "We propose", "orig": "We propose", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 48, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 119.59, "r_y0": 453.388, "r_x1": 175.42, "r_y1": 453.388, "r_x2": 175.42, "r_y2": 444.432, "r_x3": 119.59, "r_y3": 444.432, "coord_origin": "TOPLEFT"}, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 49, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 175.421, "r_y0": 453.372, "r_x1": 286.365, "r_y1": 453.372, "r_x2": 286.365, "r_y2": 444.82, "r_x3": 175.421, "r_y3": 444.82, "coord_origin": "TOPLEFT"}, "text": ", a transformer based model", "orig": ", a transformer based model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 50, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.037, "r_y0": 465.327, "r_x1": 286.365, "r_y1": 465.327, "r_x2": 286.365, "r_y2": 456.775, "r_x3": 70.037, "r_y3": 456.775, "coord_origin": "TOPLEFT"}, "text": "that predicts tables structure and bounding boxes for", "orig": "that predicts tables structure and bounding boxes for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 51, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.037, "r_y0": 477.282, "r_x1": 286.365, "r_y1": 477.282, "r_x2": 286.365, "r_y2": 468.73, "r_x3": 70.037, "r_y3": 468.73, "coord_origin": "TOPLEFT"}, "text": "the table content simultaneously in an end-to-end ap-", "orig": "the table content simultaneously in an end-to-end ap-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 52, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.037, "r_y0": 489.237, "r_x1": 99.636, "r_y1": 489.237, "r_x2": 99.636, "r_y2": 480.685, "r_x3": 70.037, "r_y3": 480.685, "coord_origin": "TOPLEFT"}, "text": "proach.", "orig": "proach.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 5, "label": "list_item", "bbox": {"l": 61.569, "t": 502.034, "r": 286.365, "b": 546.84, "coord_origin": "TOPLEFT"}, "confidence": 0.982271671295166, "cells": [{"index": 53, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 61.569, "r_y0": 510.974, "r_x1": 65.056, "r_y1": 510.974, "r_x2": 65.056, "r_y2": 502.422, "r_x3": 61.569, "r_y3": 502.422, "coord_origin": "TOPLEFT"}, "text": "\u2022", "orig": "\u2022", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 54, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.037, "r_y0": 510.974, "r_x1": 111.88, "r_y1": 510.974, "r_x2": 111.88, "r_y2": 502.422, "r_x3": 70.037, "r_y3": 502.422, "coord_origin": "TOPLEFT"}, "text": "Across all", "orig": "Across all", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 55, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 116.084, "r_y0": 510.974, "r_x1": 196.104, "r_y1": 510.974, "r_x2": 196.104, "r_y2": 502.422, "r_x3": 116.084, "r_y3": 502.422, "coord_origin": "TOPLEFT"}, "text": "benchmark datasets", "orig": "benchmark datasets", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 56, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 200.31, "r_y0": 510.99, "r_x1": 256.14, "r_y1": 510.99, "r_x2": 256.14, "r_y2": 502.034, "r_x3": 200.31, "r_y3": 502.034, "coord_origin": "TOPLEFT"}, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 57, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 260.35, "r_y0": 510.974, "r_x1": 286.362, "r_y1": 510.974, "r_x2": 286.362, "r_y2": 502.422, "r_x3": 260.35, "r_y3": 502.422, "coord_origin": "TOPLEFT"}, "text": "signif-", "orig": "signif-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 58, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.037, "r_y0": 522.929, "r_x1": 97.155, "r_y1": 522.929, "r_x2": 97.155, "r_y2": 514.377, "r_x3": 70.037, "r_y3": 514.377, "coord_origin": "TOPLEFT"}, "text": "icantly", "orig": "icantly", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 59, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 101.678, "r_y0": 522.929, "r_x1": 150.375, "r_y1": 522.929, "r_x2": 150.375, "r_y2": 514.377, "r_x3": 101.678, "r_y3": 514.377, "coord_origin": "TOPLEFT"}, "text": "outperforms", "orig": "outperforms", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 60, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 154.898, "r_y0": 522.929, "r_x1": 186.301, "r_y1": 522.929, "r_x2": 186.301, "r_y2": 514.377, "r_x3": 154.898, "r_y3": 514.377, "coord_origin": "TOPLEFT"}, "text": "existing", "orig": "existing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 61, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 190.824, "r_y0": 522.929, "r_x1": 250.021, "r_y1": 522.929, "r_x2": 250.021, "r_y2": 514.377, "r_x3": 190.824, "r_y3": 514.377, "coord_origin": "TOPLEFT"}, "text": "state-of-the-art", "orig": "state-of-the-art", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 62, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 254.544, "r_y0": 522.929, "r_x1": 286.365, "r_y1": 522.929, "r_x2": 286.365, "r_y2": 514.377, "r_x3": 254.544, "r_y3": 514.377, "coord_origin": "TOPLEFT"}, "text": "metrics,", "orig": "metrics,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 63, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.037, "r_y0": 534.885, "r_x1": 286.365, "r_y1": 534.885, "r_x2": 286.365, "r_y2": 526.3330000000001, "r_x3": 70.037, "r_y3": 526.3330000000001, "coord_origin": "TOPLEFT"}, "text": "while being much more efficient in training and infer-", "orig": "while being much more efficient in training and infer-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 64, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.037, "r_y0": 546.84, "r_x1": 161.653, "r_y1": 546.84, "r_x2": 161.653, "r_y2": 538.288, "r_x3": 70.037, "r_y3": 538.288, "coord_origin": "TOPLEFT"}, "text": "ence to existing works.", "orig": "ence to existing works.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 9, "label": "list_item", "bbox": {"l": 61.569, "t": 559.637, "r": 286.365, "b": 592.487, "coord_origin": "TOPLEFT"}, "confidence": 0.9802963733673096, "cells": [{"index": 65, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 61.569, "r_y0": 568.577, "r_x1": 65.056, "r_y1": 568.577, "r_x2": 65.056, "r_y2": 560.025, "r_x3": 61.569, "r_y3": 560.025, "coord_origin": "TOPLEFT"}, "text": "\u2022", "orig": "\u2022", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 66, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.037, "r_y0": 568.577, "r_x1": 116.712, "r_y1": 568.577, "r_x2": 116.712, "r_y2": 560.025, "r_x3": 70.037, "r_y3": 560.025, "coord_origin": "TOPLEFT"}, "text": "We present", "orig": "We present", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 67, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 121.583, "r_y0": 568.593, "r_x1": 177.682, "r_y1": 568.593, "r_x2": 177.682, "r_y2": 559.637, "r_x3": 121.583, "r_y3": 559.637, "coord_origin": "TOPLEFT"}, "text": "SynthTabNet", "orig": "SynthTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 68, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 182.553, "r_y0": 568.577, "r_x1": 186.976, "r_y1": 568.577, "r_x2": 186.976, "r_y2": 560.025, "r_x3": 182.553, "r_y3": 560.025, "coord_origin": "TOPLEFT"}, "text": "a", "orig": "a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 69, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 191.848, "r_y0": 568.577, "r_x1": 242.767, "r_y1": 568.577, "r_x2": 242.767, "r_y2": 560.025, "r_x3": 191.848, "r_y3": 560.025, "coord_origin": "TOPLEFT"}, "text": "synthetically", "orig": "synthetically", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 70, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 247.639, "r_y0": 568.577, "r_x1": 286.363, "r_y1": 568.577, "r_x2": 286.363, "r_y2": 560.025, "r_x3": 247.639, "r_y3": 560.025, "coord_origin": "TOPLEFT"}, "text": "generated", "orig": "generated", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 71, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.037, "r_y0": 580.532, "r_x1": 286.365, "r_y1": 580.532, "r_x2": 286.365, "r_y2": 571.98, "r_x3": 70.037, "r_y3": 571.98, "coord_origin": "TOPLEFT"}, "text": "dataset, with various appearance styles and complex-", "orig": "dataset, with various appearance styles and complex-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 72, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.037, "r_y0": 592.487, "r_x1": 82.401, "r_y1": 592.487, "r_x2": 82.401, "r_y2": 583.935, "r_x3": 70.037, "r_y3": 583.935, "coord_origin": "TOPLEFT"}, "text": "ity.", "orig": "ity.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 8, "label": "list_item", "bbox": {"l": 61.569, "t": 605.672, "r": 286.365, "b": 638.135, "coord_origin": "TOPLEFT"}, "confidence": 0.9806395173072815, "cells": [{"index": 73, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 61.569, "r_y0": 614.2239999999999, "r_x1": 65.056, "r_y1": 614.2239999999999, "r_x2": 65.056, "r_y2": 605.672, "r_x3": 61.569, "r_y3": 605.672, "coord_origin": "TOPLEFT"}, "text": "\u2022", "orig": "\u2022", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 74, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.037, "r_y0": 614.2239999999999, "r_x1": 132.005, "r_y1": 614.2239999999999, "r_x2": 132.005, "r_y2": 605.672, "r_x3": 70.037, "r_y3": 605.672, "coord_origin": "TOPLEFT"}, "text": "An augmented", "orig": "An augmented", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 75, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 138.082, "r_y0": 614.2239999999999, "r_x1": 165.748, "r_y1": 614.2239999999999, "r_x2": 165.748, "r_y2": 605.672, "r_x3": 138.082, "r_y3": 605.672, "coord_origin": "TOPLEFT"}, "text": "dataset", "orig": "dataset", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 76, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 171.815, "r_y0": 614.2239999999999, "r_x1": 194.5, "r_y1": 614.2239999999999, "r_x2": 194.5, "r_y2": 605.672, "r_x3": 171.815, "r_y3": 605.672, "coord_origin": "TOPLEFT"}, "text": "based", "orig": "based", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 77, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 200.577, "r_y0": 614.2239999999999, "r_x1": 210.54, "r_y1": 614.2239999999999, "r_x2": 210.54, "r_y2": 605.672, "r_x3": 200.577, "r_y3": 605.672, "coord_origin": "TOPLEFT"}, "text": "on", "orig": "on", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 78, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 216.617, "r_y0": 614.2239999999999, "r_x1": 261.2, "r_y1": 614.2239999999999, "r_x2": 261.2, "r_y2": 605.672, "r_x3": 216.617, "r_y3": 605.672, "coord_origin": "TOPLEFT"}, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 79, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 267.277, "r_y0": 614.2239999999999, "r_x1": 286.365, "r_y1": 614.2239999999999, "r_x2": 286.365, "r_y2": 605.672, "r_x3": 267.277, "r_y3": 605.672, "coord_origin": "TOPLEFT"}, "text": "[37],", "orig": "[37],", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 80, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.037, "r_y0": 626.179, "r_x1": 135.521, "r_y1": 626.179, "r_x2": 135.521, "r_y2": 617.627, "r_x3": 70.037, "r_y3": 617.627, "coord_origin": "TOPLEFT"}, "text": "FinTabNet [36],", "orig": "FinTabNet [36],", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 81, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 139.925, "r_y0": 626.179, "r_x1": 286.365, "r_y1": 626.179, "r_x2": 286.365, "r_y2": 617.627, "r_x3": 139.925, "r_y3": 617.627, "coord_origin": "TOPLEFT"}, "text": "and TableBank [17] with generated", "orig": "and TableBank [17] with generated", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 82, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.037, "r_y0": 638.135, "r_x1": 198.056, "r_y1": 638.135, "r_x2": 198.056, "r_y2": 629.583, "r_x3": 70.037, "r_y3": 629.583, "coord_origin": "TOPLEFT"}, "text": "ground-truth for reproducibility.", "orig": "ground-truth for reproducibility.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 11, "label": "text", "bbox": {"l": 50.112, "t": 650.867, "r": 286.365, "b": 695.284, "coord_origin": "TOPLEFT"}, "confidence": 0.9742533564567566, "cells": [{"index": 83, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 659.419, "r_x1": 204.452, "r_y1": 659.419, "r_x2": 204.452, "r_y2": 650.867, "r_x3": 62.067, "r_y3": 650.867, "coord_origin": "TOPLEFT"}, "text": "The paper is structured as follows.", "orig": "The paper is structured as follows.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 84, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 210.789, "r_y0": 659.419, "r_x1": 286.365, "r_y1": 659.419, "r_x2": 286.365, "r_y2": 650.867, "r_x3": 210.789, "r_y3": 650.867, "coord_origin": "TOPLEFT"}, "text": "In Sec. 2, we give", "orig": "In Sec. 2, we give", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 85, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 671.374, "r_x1": 240.896, "r_y1": 671.374, "r_x2": 240.896, "r_y2": 662.822, "r_x3": 50.112, "r_y3": 662.822, "coord_origin": "TOPLEFT"}, "text": "a brief overview of the current state-of-the-art.", "orig": "a brief overview of the current state-of-the-art.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 86, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 246.833, "r_y0": 671.374, "r_x1": 286.365, "r_y1": 671.374, "r_x2": 286.365, "r_y2": 662.822, "r_x3": 246.833, "r_y3": 662.822, "coord_origin": "TOPLEFT"}, "text": "In Sec. 3,", "orig": "In Sec. 3,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 87, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 683.329, "r_x1": 227.396, "r_y1": 683.329, "r_x2": 227.396, "r_y2": 674.777, "r_x3": 50.112, "r_y3": 674.777, "coord_origin": "TOPLEFT"}, "text": "we describe the datasets on which we train.", "orig": "we describe the datasets on which we train.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 88, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 232.467, "r_y0": 683.329, "r_x1": 286.365, "r_y1": 683.329, "r_x2": 286.365, "r_y2": 674.777, "r_x3": 232.467, "r_y3": 674.777, "coord_origin": "TOPLEFT"}, "text": "In Sec. 4, we", "orig": "In Sec. 4, we", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 89, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 695.284, "r_x1": 286.365, "r_y1": 695.284, "r_x2": 286.365, "r_y2": 686.732, "r_x3": 50.112, "r_y3": 686.732, "coord_origin": "TOPLEFT"}, "text": "introduce the TableFormer model-architecture and describe", "orig": "introduce the TableFormer model-architecture and describe", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 14, "label": "footnote", "bbox": {"l": 60.971, "t": 704.296, "r": 183.731, "b": 712.653, "coord_origin": "TOPLEFT"}, "confidence": 0.895367443561554, "cells": [{"index": 90, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 60.971, "r_y0": 709.427, "r_x1": 63.96, "r_y1": 709.427, "r_x2": 63.96, "r_y2": 704.296, "r_x3": 60.971, "r_y3": 704.296, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 91, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 64.458, "r_y0": 712.653, "r_x1": 183.731, "r_y1": 712.653, "r_x2": 183.731, "r_y2": 705.811, "r_x3": 64.458, "r_y3": 705.811, "coord_origin": "TOPLEFT"}, "text": "https://github.com/IBM/SynthTabNet", "orig": "https://github.com/IBM/SynthTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 10, "label": "text", "bbox": {"l": 308.862, "t": 75.47699999999998, "r": 545.115, "b": 107.93899999999996, "coord_origin": "TOPLEFT"}, "confidence": 0.9774322509765625, "cells": [{"index": 92, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 84.029, "r_x1": 545.115, "r_y1": 84.029, "r_x2": 545.115, "r_y2": 75.47699999999998, "r_x3": 308.862, "r_y3": 75.47699999999998, "coord_origin": "TOPLEFT"}, "text": "its results &performance in Sec. 5. As a conclusion, we de-", "orig": "its results &performance in Sec. 5. As a conclusion, we de-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 93, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 95.98400000000004, "r_x1": 545.115, "r_y1": 95.98400000000004, "r_x2": 545.115, "r_y2": 87.43200000000002, "r_x3": 308.862, "r_y3": 87.43200000000002, "coord_origin": "TOPLEFT"}, "text": "scribe how this new model-architecture can be re-purposed", "orig": "scribe how this new model-architecture can be re-purposed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 94, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 107.93899999999996, "r_x1": 508.084, "r_y1": 107.93899999999996, "r_x2": 508.084, "r_y2": 99.38699999999994, "r_x3": 308.862, "r_y3": 99.38699999999994, "coord_origin": "TOPLEFT"}, "text": "for other tasks in the computer-vision community.", "orig": "for other tasks in the computer-vision community.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 13, "label": "section_header", "bbox": {"l": 308.862, "t": 121.73199999999997, "r": 498.28, "b": 132.48000000000002, "coord_origin": "TOPLEFT"}, "confidence": 0.9428724646568298, "cells": [{"index": 95, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 132.48000000000002, "r_x1": 498.28, "r_y1": 132.48000000000002, "r_x2": 498.28, "r_y2": 121.73199999999997, "r_x3": 308.862, "r_y3": 121.73199999999997, "coord_origin": "TOPLEFT"}, "text": "2. Previous work and State of the Art", "orig": "2. Previous work and State of the Art", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 0, "label": "text", "bbox": {"l": 308.862, "t": 142.49, "r": 545.115, "b": 330.369, "coord_origin": "TOPLEFT"}, "confidence": 0.987194836139679, "cells": [{"index": 96, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 151.04200000000003, "r_x1": 545.115, "r_y1": 151.04200000000003, "r_x2": 545.115, "r_y2": 142.49, "r_x3": 320.817, "r_y3": 142.49, "coord_origin": "TOPLEFT"}, "text": "Identifying the structure of a table has been an outstand-", "orig": "Identifying the structure of a table has been an outstand-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 97, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 162.99699999999996, "r_x1": 545.115, "r_y1": 162.99699999999996, "r_x2": 545.115, "r_y2": 154.44500000000005, "r_x3": 308.862, "r_y3": 154.44500000000005, "coord_origin": "TOPLEFT"}, "text": "ing problem in the document-parsing community, that mo-", "orig": "ing problem in the document-parsing community, that mo-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 98, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 174.952, "r_x1": 334.376, "r_y1": 174.952, "r_x2": 334.376, "r_y2": 166.39999999999998, "r_x3": 308.862, "r_y3": 166.39999999999998, "coord_origin": "TOPLEFT"}, "text": "tivates", "orig": "tivates", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 99, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 338.192, "r_y0": 174.952, "r_x1": 522.56, "r_y1": 174.952, "r_x2": 522.56, "r_y2": 166.39999999999998, "r_x3": 338.192, "r_y3": 166.39999999999998, "coord_origin": "TOPLEFT"}, "text": "many organised public challenges [6, 4, 14].", "orig": "many organised public challenges [6, 4, 14].", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 100, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 529.623, "r_y0": 174.952, "r_x1": 545.115, "r_y1": 174.952, "r_x2": 545.115, "r_y2": 166.39999999999998, "r_x3": 529.623, "r_y3": 166.39999999999998, "coord_origin": "TOPLEFT"}, "text": "The", "orig": "The", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 101, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 186.90700000000004, "r_x1": 545.115, "r_y1": 186.90700000000004, "r_x2": 545.115, "r_y2": 178.35500000000002, "r_x3": 308.862, "r_y3": 178.35500000000002, "coord_origin": "TOPLEFT"}, "text": "difficulty of the problem can be attributed to a number of", "orig": "difficulty of the problem can be attributed to a number of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 102, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 198.86199999999997, "r_x1": 545.115, "r_y1": 198.86199999999997, "r_x2": 545.115, "r_y2": 190.30999999999995, "r_x3": 308.862, "r_y3": 190.30999999999995, "coord_origin": "TOPLEFT"}, "text": "factors. First, there is a large variety in the shapes and sizes", "orig": "factors. First, there is a large variety in the shapes and sizes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 103, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 210.817, "r_x1": 346.979, "r_y1": 210.817, "r_x2": 346.979, "r_y2": 202.265, "r_x3": 308.862, "r_y3": 202.265, "coord_origin": "TOPLEFT"}, "text": "of tables.", "orig": "of tables.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 104, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 354.869, "r_y0": 210.817, "r_x1": 508.642, "r_y1": 210.817, "r_x2": 508.642, "r_y2": 202.265, "r_x3": 354.869, "r_y3": 202.265, "coord_origin": "TOPLEFT"}, "text": "Such large variety requires a flexible", "orig": "Such large variety requires a flexible", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 105, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 512.737, "r_y0": 210.817, "r_x1": 545.115, "r_y1": 210.817, "r_x2": 545.115, "r_y2": 202.265, "r_x3": 512.737, "r_y3": 202.265, "coord_origin": "TOPLEFT"}, "text": "method.", "orig": "method.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 106, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 222.77300000000002, "r_x1": 545.115, "r_y1": 222.77300000000002, "r_x2": 545.115, "r_y2": 214.221, "r_x3": 308.862, "r_y3": 214.221, "coord_origin": "TOPLEFT"}, "text": "This is especially true for complex column- and row head-", "orig": "This is especially true for complex column- and row head-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 107, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 234.72799999999995, "r_x1": 322.969, "r_y1": 234.72799999999995, "r_x2": 322.969, "r_y2": 226.17600000000004, "r_x3": 308.862, "r_y3": 226.17600000000004, "coord_origin": "TOPLEFT"}, "text": "ers,", "orig": "ers,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 108, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 327.084, "r_y0": 234.72799999999995, "r_x1": 530.918, "r_y1": 234.72799999999995, "r_x2": 530.918, "r_y2": 226.17600000000004, "r_x3": 327.084, "r_y3": 226.17600000000004, "coord_origin": "TOPLEFT"}, "text": "which can be extremely intricate and demanding.", "orig": "which can be extremely intricate and demanding.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 109, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 537.922, "r_y0": 234.72799999999995, "r_x1": 545.115, "r_y1": 234.72799999999995, "r_x2": 545.115, "r_y2": 226.17600000000004, "r_x3": 537.922, "r_y3": 226.17600000000004, "coord_origin": "TOPLEFT"}, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 110, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 246.683, "r_x1": 545.115, "r_y1": 246.683, "r_x2": 545.115, "r_y2": 238.13099999999997, "r_x3": 308.862, "r_y3": 238.13099999999997, "coord_origin": "TOPLEFT"}, "text": "second factor of complexity is the lack of data with regard", "orig": "second factor of complexity is the lack of data with regard", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 111, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 258.63800000000003, "r_x1": 545.115, "r_y1": 258.63800000000003, "r_x2": 545.115, "r_y2": 250.086, "r_x3": 308.862, "r_y3": 250.086, "coord_origin": "TOPLEFT"}, "text": "to table-structure. Until the publication of PubTabNet [37],", "orig": "to table-structure. Until the publication of PubTabNet [37],", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 112, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 270.59299999999996, "r_x1": 439.84, "r_y1": 270.59299999999996, "r_x2": 439.84, "r_y2": 262.04100000000005, "r_x3": 308.862, "r_y3": 262.04100000000005, "coord_origin": "TOPLEFT"}, "text": "there were no large datasets (i.e.", "orig": "there were no large datasets (i.e.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 113, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 444.44, "r_y0": 270.429, "r_x1": 452.189, "r_y1": 270.429, "r_x2": 452.189, "r_y2": 261.72299999999996, "r_x3": 444.44, "r_y3": 261.72299999999996, "coord_origin": "TOPLEFT"}, "text": ">", "orig": ">", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 114, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 455.89, "r_y0": 270.429, "r_x1": 470.834, "r_y1": 270.429, "r_x2": 470.834, "r_y2": 261.72299999999996, "r_x3": 455.89, "r_y3": 261.72299999999996, "coord_origin": "TOPLEFT"}, "text": "100", "orig": "100", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 115, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 470.834, "r_y0": 270.59299999999996, "r_x1": 545.115, "r_y1": 270.59299999999996, "r_x2": 545.115, "r_y2": 262.04100000000005, "r_x3": 470.834, "r_y3": 262.04100000000005, "coord_origin": "TOPLEFT"}, "text": "K tables) that pro-", "orig": "K tables) that pro-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 116, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 282.548, "r_x1": 545.115, "r_y1": 282.548, "r_x2": 545.115, "r_y2": 273.996, "r_x3": 308.862, "r_y3": 273.996, "coord_origin": "TOPLEFT"}, "text": "vided structure information. This happens primarily due to", "orig": "vided structure information. This happens primarily due to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 117, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 294.504, "r_x1": 545.115, "r_y1": 294.504, "r_x2": 545.115, "r_y2": 285.952, "r_x3": 308.862, "r_y3": 285.952, "coord_origin": "TOPLEFT"}, "text": "the fact that tables are notoriously time-consuming to an-", "orig": "the fact that tables are notoriously time-consuming to an-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 118, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 306.459, "r_x1": 545.115, "r_y1": 306.459, "r_x2": 545.115, "r_y2": 297.907, "r_x3": 308.862, "r_y3": 297.907, "coord_origin": "TOPLEFT"}, "text": "notate by hand. However, this has definitely changed in re-", "orig": "notate by hand. However, this has definitely changed in re-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 119, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 318.414, "r_x1": 545.115, "r_y1": 318.414, "r_x2": 545.115, "r_y2": 309.862, "r_x3": 308.862, "r_y3": 309.862, "coord_origin": "TOPLEFT"}, "text": "cent years with the deliverance of PubTabNet [37], FinTab-", "orig": "cent years with the deliverance of PubTabNet [37], FinTab-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 120, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 330.369, "r_x1": 425.923, "r_y1": 330.369, "r_x2": 425.923, "r_y2": 321.817, "r_x3": 308.862, "r_y3": 321.817, "coord_origin": "TOPLEFT"}, "text": "Net [36], TableBank [17] etc.", "orig": "Net [36], TableBank [17] etc.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 1, "label": "text", "bbox": {"l": 308.862, "t": 333.838, "r": 545.115, "b": 449.987, "coord_origin": "TOPLEFT"}, "confidence": 0.9869040250778198, "cells": [{"index": 121, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 342.39, "r_x1": 391.492, "r_y1": 342.39, "r_x2": 391.492, "r_y2": 333.838, "r_x3": 320.817, "r_y3": 333.838, "coord_origin": "TOPLEFT"}, "text": "Before the rising", "orig": "Before the rising", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 122, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 395.845, "r_y0": 342.39, "r_x1": 436.802, "r_y1": 342.39, "r_x2": 436.802, "r_y2": 333.838, "r_x3": 395.845, "r_y3": 333.838, "coord_origin": "TOPLEFT"}, "text": "popularity", "orig": "popularity", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 123, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 441.145, "r_y0": 342.39, "r_x1": 449.444, "r_y1": 342.39, "r_x2": 449.444, "r_y2": 333.838, "r_x3": 441.145, "r_y3": 333.838, "coord_origin": "TOPLEFT"}, "text": "of", "orig": "of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 124, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 453.798, "r_y0": 342.39, "r_x1": 545.115, "r_y1": 342.39, "r_x2": 545.115, "r_y2": 333.838, "r_x3": 453.798, "r_y3": 333.838, "coord_origin": "TOPLEFT"}, "text": "deep neural networks,", "orig": "deep neural networks,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 125, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 354.345, "r_x1": 545.115, "r_y1": 354.345, "r_x2": 545.115, "r_y2": 345.793, "r_x3": 308.862, "r_y3": 345.793, "coord_origin": "TOPLEFT"}, "text": "the community relied heavily on heuristic and/or statistical", "orig": "the community relied heavily on heuristic and/or statistical", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 126, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 366.3, "r_x1": 545.115, "r_y1": 366.3, "r_x2": 545.115, "r_y2": 357.748, "r_x3": 308.862, "r_y3": 357.748, "coord_origin": "TOPLEFT"}, "text": "methods to do table structure identification [3, 7, 11, 5, 13,", "orig": "methods to do table structure identification [3, 7, 11, 5, 13,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 127, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 378.256, "r_x1": 324.633, "r_y1": 378.256, "r_x2": 324.633, "r_y2": 369.704, "r_x3": 308.862, "r_y3": 369.704, "coord_origin": "TOPLEFT"}, "text": "28].", "orig": "28].", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 128, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 329.634, "r_y0": 378.256, "r_x1": 545.115, "r_y1": 378.256, "r_x2": 545.115, "r_y2": 369.704, "r_x3": 329.634, "r_y3": 369.704, "coord_origin": "TOPLEFT"}, "text": "Although such methods work well on constrained ta-", "orig": "Although such methods work well on constrained ta-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 129, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 390.211, "r_x1": 545.115, "r_y1": 390.211, "r_x2": 545.115, "r_y2": 381.659, "r_x3": 308.862, "r_y3": 381.659, "coord_origin": "TOPLEFT"}, "text": "bles [12], a more data-driven approach can be applied due", "orig": "bles [12], a more data-driven approach can be applied due", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 130, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 402.166, "r_x1": 545.115, "r_y1": 402.166, "r_x2": 545.115, "r_y2": 393.614, "r_x3": 308.862, "r_y3": 393.614, "coord_origin": "TOPLEFT"}, "text": "to the advent of convolutional neural networks (CNNs) and", "orig": "to the advent of convolutional neural networks (CNNs) and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 131, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 414.121, "r_x1": 438.416, "r_y1": 414.121, "r_x2": 438.416, "r_y2": 405.569, "r_x3": 308.862, "r_y3": 405.569, "coord_origin": "TOPLEFT"}, "text": "the availability of large datasets.", "orig": "the availability of large datasets.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 132, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 442.231, "r_y0": 414.121, "r_x1": 545.115, "r_y1": 414.121, "r_x2": 545.115, "r_y2": 405.569, "r_x3": 442.231, "r_y3": 405.569, "coord_origin": "TOPLEFT"}, "text": "To the best-of-our knowl-", "orig": "To the best-of-our knowl-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 133, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 426.076, "r_x1": 545.115, "r_y1": 426.076, "r_x2": 545.115, "r_y2": 417.524, "r_x3": 308.862, "r_y3": 417.524, "coord_origin": "TOPLEFT"}, "text": "edge, there are currently two different types of network ar-", "orig": "edge, there are currently two different types of network ar-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 134, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 438.032, "r_x1": 545.115, "r_y1": 438.032, "r_x2": 545.115, "r_y2": 429.48, "r_x3": 308.862, "r_y3": 429.48, "coord_origin": "TOPLEFT"}, "text": "chitecture that are being pursued for state-of-the-art table-", "orig": "chitecture that are being pursued for state-of-the-art table-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 135, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 449.987, "r_x1": 401.285, "r_y1": 449.987, "r_x2": 401.285, "r_y2": 441.435, "r_x3": 308.862, "r_y3": 441.435, "coord_origin": "TOPLEFT"}, "text": "structure identification.", "orig": "structure identification.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 3, "label": "text", "bbox": {"l": 308.862, "t": 453.068, "r": 545.117, "b": 713.066, "coord_origin": "TOPLEFT"}, "confidence": 0.9843218326568604, "cells": [{"index": 136, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 462.024, "r_x1": 423.262, "r_y1": 462.024, "r_x2": 423.262, "r_y2": 453.068, "r_x3": 320.817, "r_y3": 453.068, "coord_origin": "TOPLEFT"}, "text": "Image-to-Text networks", "orig": "Image-to-Text networks", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 137, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 423.267, "r_y0": 462.008, "r_x1": 426.037, "r_y1": 462.008, "r_x2": 426.037, "r_y2": 453.456, "r_x3": 423.267, "r_y3": 453.456, "coord_origin": "TOPLEFT"}, "text": ":", "orig": ":", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 138, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 430.769, "r_y0": 462.008, "r_x1": 545.11, "r_y1": 462.008, "r_x2": 545.11, "r_y2": 453.456, "r_x3": 430.769, "r_y3": 453.456, "coord_origin": "TOPLEFT"}, "text": "In this type of network, one", "orig": "In this type of network, one", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 139, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 473.963, "r_x1": 340.404, "r_y1": 473.963, "r_x2": 340.404, "r_y2": 465.411, "r_x3": 308.862, "r_y3": 465.411, "coord_origin": "TOPLEFT"}, "text": "predicts", "orig": "predicts", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 140, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 345.116, "r_y0": 473.963, "r_x1": 349.539, "r_y1": 473.963, "r_x2": 349.539, "r_y2": 465.411, "r_x3": 345.116, "r_y3": 465.411, "coord_origin": "TOPLEFT"}, "text": "a", "orig": "a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 141, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 354.252, "r_y0": 473.963, "r_x1": 390.765, "r_y1": 473.963, "r_x2": 390.765, "r_y2": 465.411, "r_x3": 354.252, "r_y3": 465.411, "coord_origin": "TOPLEFT"}, "text": "sequence", "orig": "sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 142, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 395.477, "r_y0": 473.963, "r_x1": 403.776, "r_y1": 473.963, "r_x2": 403.776, "r_y2": 465.411, "r_x3": 395.477, "r_y3": 465.411, "coord_origin": "TOPLEFT"}, "text": "of", "orig": "of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 143, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 408.488, "r_y0": 473.963, "r_x1": 434.401, "r_y1": 473.963, "r_x2": 434.401, "r_y2": 465.411, "r_x3": 408.488, "r_y3": 465.411, "coord_origin": "TOPLEFT"}, "text": "tokens", "orig": "tokens", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 144, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 439.113, "r_y0": 473.963, "r_x1": 469.001, "r_y1": 473.963, "r_x2": 469.001, "r_y2": 465.411, "r_x3": 439.113, "r_y3": 465.411, "coord_origin": "TOPLEFT"}, "text": "starting", "orig": "starting", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 145, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 473.713, "r_y0": 473.963, "r_x1": 545.115, "r_y1": 473.963, "r_x2": 545.115, "r_y2": 465.411, "r_x3": 473.713, "r_y3": 465.411, "coord_origin": "TOPLEFT"}, "text": "from an encoded", "orig": "from an encoded", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 146, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 485.918, "r_x1": 335.701, "r_y1": 485.918, "r_x2": 335.701, "r_y2": 477.366, "r_x3": 308.862, "r_y3": 477.366, "coord_origin": "TOPLEFT"}, "text": "image.", "orig": "image.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 147, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 345.853, "r_y0": 485.918, "r_x1": 411.009, "r_y1": 485.918, "r_x2": 411.009, "r_y2": 477.366, "r_x3": 345.853, "r_y3": 477.366, "coord_origin": "TOPLEFT"}, "text": "Such sequences", "orig": "Such sequences", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 148, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 415.85, "r_y0": 485.918, "r_x1": 424.149, "r_y1": 485.918, "r_x2": 424.149, "r_y2": 477.366, "r_x3": 415.85, "r_y3": 477.366, "coord_origin": "TOPLEFT"}, "text": "of", "orig": "of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 149, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 429.001, "r_y0": 485.918, "r_x1": 454.914, "r_y1": 485.918, "r_x2": 454.914, "r_y2": 477.366, "r_x3": 429.001, "r_y3": 477.366, "coord_origin": "TOPLEFT"}, "text": "tokens", "orig": "tokens", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 150, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 459.756, "r_y0": 485.918, "r_x1": 473.584, "r_y1": 485.918, "r_x2": 473.584, "r_y2": 477.366, "r_x3": 459.756, "r_y3": 477.366, "coord_origin": "TOPLEFT"}, "text": "can", "orig": "can", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 151, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 478.425, "r_y0": 485.918, "r_x1": 487.83, "r_y1": 485.918, "r_x2": 487.83, "r_y2": 477.366, "r_x3": 478.425, "r_y3": 477.366, "coord_origin": "TOPLEFT"}, "text": "be", "orig": "be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 152, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 492.682, "r_y0": 485.918, "r_x1": 545.115, "r_y1": 485.918, "r_x2": 545.115, "r_y2": 477.366, "r_x3": 492.682, "r_y3": 477.366, "coord_origin": "TOPLEFT"}, "text": "HTML table", "orig": "HTML table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 153, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 497.873, "r_x1": 459.218, "r_y1": 497.873, "r_x2": 459.218, "r_y2": 489.321, "r_x3": 308.862, "r_y3": 489.321, "coord_origin": "TOPLEFT"}, "text": "tags [37, 17] or LaTeX symbols[10].", "orig": "tags [37, 17] or LaTeX symbols[10].", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 154, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 465.115, "r_y0": 497.873, "r_x1": 545.115, "r_y1": 497.873, "r_x2": 545.115, "r_y2": 489.321, "r_x3": 465.115, "r_y3": 489.321, "coord_origin": "TOPLEFT"}, "text": "The choice of sym-", "orig": "The choice of sym-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 155, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 509.828, "r_x1": 545.115, "r_y1": 509.828, "r_x2": 545.115, "r_y2": 501.276, "r_x3": 308.862, "r_y3": 501.276, "coord_origin": "TOPLEFT"}, "text": "bols is ultimately not very important, since one can be trans-", "orig": "bols is ultimately not very important, since one can be trans-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 156, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 521.784, "r_x1": 396.692, "r_y1": 521.784, "r_x2": 396.692, "r_y2": 513.232, "r_x3": 308.862, "r_y3": 513.232, "coord_origin": "TOPLEFT"}, "text": "formed into the other.", "orig": "formed into the other.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 157, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 401.265, "r_y0": 521.784, "r_x1": 545.115, "r_y1": 521.784, "r_x2": 545.115, "r_y2": 513.232, "r_x3": 401.265, "r_y3": 513.232, "coord_origin": "TOPLEFT"}, "text": "There are however subtle variations", "orig": "There are however subtle variations", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 158, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 533.739, "r_x1": 433.484, "r_y1": 533.739, "r_x2": 433.484, "r_y2": 525.187, "r_x3": 308.862, "r_y3": 525.187, "coord_origin": "TOPLEFT"}, "text": "in the Image-to-Text networks.", "orig": "in the Image-to-Text networks.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 159, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 438.187, "r_y0": 533.739, "r_x1": 545.115, "r_y1": 533.739, "r_x2": 545.115, "r_y2": 525.187, "r_x3": 438.187, "r_y3": 525.187, "coord_origin": "TOPLEFT"}, "text": "The easiest network archi-", "orig": "The easiest network archi-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 160, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 545.694, "r_x1": 420.941, "r_y1": 545.694, "r_x2": 420.941, "r_y2": 537.142, "r_x3": 308.862, "r_y3": 537.142, "coord_origin": "TOPLEFT"}, "text": "tectures are 'image-encoder", "orig": "tectures are 'image-encoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 161, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 423.595, "r_y0": 545.388, "r_x1": 433.558, "r_y1": 545.388, "r_x2": 433.558, "r_y2": 536.8240000000001, "r_x3": 423.595, "r_y3": 536.8240000000001, "coord_origin": "TOPLEFT"}, "text": "\u2192", "orig": "\u2192", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 162, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 436.212, "r_y0": 545.694, "r_x1": 545.113, "r_y1": 545.694, "r_x2": 545.113, "r_y2": 537.142, "r_x3": 436.212, "r_y3": 537.142, "coord_origin": "TOPLEFT"}, "text": "text-decoder' (IETD), sim-", "orig": "text-decoder' (IETD), sim-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 163, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 557.649, "r_x1": 545.115, "r_y1": 557.649, "r_x2": 545.115, "r_y2": 549.097, "r_x3": 308.862, "r_y3": 549.097, "coord_origin": "TOPLEFT"}, "text": "ilar to network architectures that try to provide captions to", "orig": "ilar to network architectures that try to provide captions to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 164, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 569.604, "r_x1": 545.115, "r_y1": 569.604, "r_x2": 545.115, "r_y2": 561.052, "r_x3": 308.862, "r_y3": 561.052, "coord_origin": "TOPLEFT"}, "text": "images [32]. In these IETD networks, one expects as output", "orig": "images [32]. In these IETD networks, one expects as output", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 165, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 581.559, "r_x1": 503.671, "r_y1": 581.559, "r_x2": 503.671, "r_y2": 573.0070000000001, "r_x3": 308.862, "r_y3": 573.0070000000001, "coord_origin": "TOPLEFT"}, "text": "the LaTeX/HTML string of the entire table, i.e.", "orig": "the LaTeX/HTML string of the entire table, i.e.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 166, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 509.579, "r_y0": 581.559, "r_x1": 545.115, "r_y1": 581.559, "r_x2": 545.115, "r_y2": 573.0070000000001, "r_x3": 509.579, "r_y3": 573.0070000000001, "coord_origin": "TOPLEFT"}, "text": "the sym-", "orig": "the sym-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 167, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 593.515, "r_x1": 545.115, "r_y1": 593.515, "r_x2": 545.115, "r_y2": 584.963, "r_x3": 308.862, "r_y3": 584.963, "coord_origin": "TOPLEFT"}, "text": "bols necessary for creating the table with the content of the", "orig": "bols necessary for creating the table with the content of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 168, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 605.47, "r_x1": 330.72, "r_y1": 605.47, "r_x2": 330.72, "r_y2": 596.918, "r_x3": 308.862, "r_y3": 596.918, "coord_origin": "TOPLEFT"}, "text": "table.", "orig": "table.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 169, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 334.536, "r_y0": 605.47, "r_x1": 497.075, "r_y1": 605.47, "r_x2": 497.075, "r_y2": 596.918, "r_x3": 334.536, "r_y3": 596.918, "coord_origin": "TOPLEFT"}, "text": "Another approach is the 'image-encoder", "orig": "Another approach is the 'image-encoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 170, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 499.805, "r_y0": 605.164, "r_x1": 509.768, "r_y1": 605.164, "r_x2": 509.768, "r_y2": 596.6, "r_x3": 499.805, "r_y3": 596.6, "coord_origin": "TOPLEFT"}, "text": "\u2192", "orig": "\u2192", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 171, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 512.501, "r_y0": 605.47, "r_x1": 545.109, "r_y1": 605.47, "r_x2": 545.109, "r_y2": 596.918, "r_x3": 512.501, "r_y3": 596.918, "coord_origin": "TOPLEFT"}, "text": "dual de-", "orig": "dual de-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 172, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 617.425, "r_x1": 545.115, "r_y1": 617.425, "r_x2": 545.115, "r_y2": 608.873, "r_x3": 308.862, "r_y3": 608.873, "coord_origin": "TOPLEFT"}, "text": "coder' (IEDD) networks. In these type of networks, one has", "orig": "coder' (IEDD) networks. In these type of networks, one has", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 173, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 629.38, "r_x1": 545.115, "r_y1": 629.38, "r_x2": 545.115, "r_y2": 620.828, "r_x3": 308.862, "r_y3": 620.828, "coord_origin": "TOPLEFT"}, "text": "two consecutive decoders with different purposes. The first", "orig": "two consecutive decoders with different purposes. The first", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 174, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 641.335, "r_x1": 364.782, "r_y1": 641.335, "r_x2": 364.782, "r_y2": 632.783, "r_x3": 308.862, "r_y3": 632.783, "coord_origin": "TOPLEFT"}, "text": "decoder is the", "orig": "decoder is the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 175, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 367.574, "r_y0": 641.192, "r_x1": 415.614, "r_y1": 641.192, "r_x2": 415.614, "r_y2": 632.604, "r_x3": 367.574, "r_y3": 632.604, "coord_origin": "TOPLEFT"}, "text": "tag-decoder", "orig": "tag-decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 176, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 415.613, "r_y0": 641.335, "r_x1": 418.104, "r_y1": 641.335, "r_x2": 418.104, "r_y2": 632.783, "r_x3": 415.613, "r_y3": 632.783, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 177, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 420.963, "r_y0": 641.335, "r_x1": 433.137, "r_y1": 641.335, "r_x2": 433.137, "r_y2": 632.783, "r_x3": 420.963, "r_y3": 632.783, "coord_origin": "TOPLEFT"}, "text": "i.e.", "orig": "i.e.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 178, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 437.122, "r_y0": 641.335, "r_x1": 442.661, "r_y1": 641.335, "r_x2": 442.661, "r_y2": 632.783, "r_x3": 437.122, "r_y3": 632.783, "coord_origin": "TOPLEFT"}, "text": "it", "orig": "it", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 179, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 445.441, "r_y0": 641.335, "r_x1": 545.117, "r_y1": 641.335, "r_x2": 545.117, "r_y2": 632.783, "r_x3": 445.441, "r_y3": 632.783, "coord_origin": "TOPLEFT"}, "text": "only produces the HTM-", "orig": "only produces the HTM-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 180, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 653.29, "r_x1": 545.115, "r_y1": 653.29, "r_x2": 545.115, "r_y2": 644.738, "r_x3": 308.862, "r_y3": 644.738, "coord_origin": "TOPLEFT"}, "text": "L/LaTeX tags which construct an empty table. The second", "orig": "L/LaTeX tags which construct an empty table. The second", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 181, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 665.103, "r_x1": 373.599, "r_y1": 665.103, "r_x2": 373.599, "r_y2": 656.515, "r_x3": 308.862, "r_y3": 656.515, "coord_origin": "TOPLEFT"}, "text": "content-decoder", "orig": "content-decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 182, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 376.907, "r_y0": 665.246, "r_x1": 545.116, "r_y1": 665.246, "r_x2": 545.116, "r_y2": 656.694, "r_x3": 376.907, "r_y3": 656.694, "coord_origin": "TOPLEFT"}, "text": "uses the encoding of the image in combi-", "orig": "uses the encoding of the image in combi-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 183, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 677.201, "r_x1": 545.115, "r_y1": 677.201, "r_x2": 545.115, "r_y2": 668.649, "r_x3": 308.862, "r_y3": 668.649, "coord_origin": "TOPLEFT"}, "text": "nation with the output encoding of each cell-tag (from the", "orig": "nation with the output encoding of each cell-tag (from the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 184, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 689.013, "r_x1": 356.902, "r_y1": 689.013, "r_x2": 356.902, "r_y2": 680.425, "r_x3": 308.862, "r_y3": 680.425, "coord_origin": "TOPLEFT"}, "text": "tag-decoder", "orig": "tag-decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 185, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 357.131, "r_y0": 689.156, "r_x1": 360.449, "r_y1": 689.156, "r_x2": 360.449, "r_y2": 680.604, "r_x3": 357.131, "r_y3": 680.604, "coord_origin": "TOPLEFT"}, "text": ")", "orig": ")", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 186, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 364.045, "r_y0": 689.156, "r_x1": 545.115, "r_y1": 689.156, "r_x2": 545.115, "r_y2": 680.604, "r_x3": 364.045, "r_y3": 680.604, "coord_origin": "TOPLEFT"}, "text": "to generate the textual content of each table", "orig": "to generate the textual content of each table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 187, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 701.111, "r_x1": 325.739, "r_y1": 701.111, "r_x2": 325.739, "r_y2": 692.559, "r_x3": 308.862, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "cell.", "orig": "cell.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 188, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 331.746, "r_y0": 701.111, "r_x1": 545.115, "r_y1": 701.111, "r_x2": 545.115, "r_y2": 692.559, "r_x3": 331.746, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "The network architecture of IEDD is certainly more", "orig": "The network architecture of IEDD is certainly more", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 189, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 713.066, "r_x1": 545.115, "r_y1": 713.066, "r_x2": 545.115, "r_y2": 704.514, "r_x3": 308.862, "r_y3": 704.514, "coord_origin": "TOPLEFT"}, "text": "elaborate, but it has the advantage that one can pre-train the", "orig": "elaborate, but it has the advantage that one can pre-train the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 15, "label": "page_footer", "bbox": {"l": 295.121, "t": 734.402, "r": 300.102, "b": 742.954, "coord_origin": "TOPLEFT"}, "confidence": 0.8778094053268433, "cells": [{"index": 190, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 295.121, "r_y0": 742.954, "r_x1": 300.102, "r_y1": 742.954, "r_x2": 300.102, "r_y2": 734.402, "r_x3": 295.121, "r_y3": 734.402, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}]}, "tablestructure": {"table_map": {}}, "figures_classification": null, "equations_prediction": null, "vlm_response": null}, "assembled": {"elements": [{"label": "text", "id": 12, "page_no": 1, "cluster": {"id": 12, "label": "text", "bbox": {"l": 50.112, "t": 75.47699999999998, "r": 286.365, "b": 95.98400000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.9656890034675598, "cells": [{"index": 0, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 84.029, "r_x1": 286.365, "r_y1": 84.029, "r_x2": 286.365, "r_y2": 75.47699999999998, "r_x3": 50.112, "r_y3": 75.47699999999998, "coord_origin": "TOPLEFT"}, "text": "considered as a solved problem, given enough ground-truth", "orig": "considered as a solved problem, given enough ground-truth", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 95.98400000000004, "r_x1": 112.647, "r_y1": 95.98400000000004, "r_x2": 112.647, "r_y2": 87.43200000000002, "r_x3": 50.112, "r_y3": 87.43200000000002, "coord_origin": "TOPLEFT"}, "text": "data to train on.", "orig": "data to train on.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "considered as a solved problem, given enough ground-truth data to train on."}, {"label": "text", "id": 4, "page_no": 1, "cluster": {"id": 4, "label": "text", "bbox": {"l": 50.112, "t": 99.84000000000003, "r": 286.365, "b": 227.94399999999996, "coord_origin": "TOPLEFT"}, "confidence": 0.9838606119155884, "cells": [{"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 108.39200000000005, "r_x1": 286.365, "r_y1": 108.39200000000005, "r_x2": 286.365, "r_y2": 99.84000000000003, "r_x3": 62.067, "r_y3": 99.84000000000003, "coord_origin": "TOPLEFT"}, "text": "The second problem is called table-structure decompo-", "orig": "The second problem is called table-structure decompo-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 120.34699999999998, "r_x1": 74.75, "r_y1": 120.34699999999998, "r_x2": 74.75, "r_y2": 111.79499999999996, "r_x3": 50.112, "r_y3": 111.79499999999996, "coord_origin": "TOPLEFT"}, "text": "sition.", "orig": "sition.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 81.335, "r_y0": 120.34699999999998, "r_x1": 286.365, "r_y1": 120.34699999999998, "r_x2": 286.365, "r_y2": 111.79499999999996, "r_x3": 81.335, "r_y3": 111.79499999999996, "coord_origin": "TOPLEFT"}, "text": "The latter is a long standing problem in the com-", "orig": "The latter is a long standing problem in the com-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 132.30200000000002, "r_x1": 235.117, "r_y1": 132.30200000000002, "r_x2": 235.117, "r_y2": 123.75, "r_x3": 50.112, "r_y3": 123.75, "coord_origin": "TOPLEFT"}, "text": "munity of document understanding [6, 4, 14].", "orig": "munity of document understanding [6, 4, 14].", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 240.079, "r_y0": 132.30200000000002, "r_x1": 286.365, "r_y1": 132.30200000000002, "r_x2": 286.365, "r_y2": 123.75, "r_x3": 240.079, "r_y3": 123.75, "coord_origin": "TOPLEFT"}, "text": "Contrary to", "orig": "Contrary to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 144.25699999999995, "r_x1": 286.365, "r_y1": 144.25699999999995, "r_x2": 286.365, "r_y2": 135.70500000000004, "r_x3": 50.112, "r_y3": 135.70500000000004, "coord_origin": "TOPLEFT"}, "text": "the table-location problem, there are no commonly used ap-", "orig": "the table-location problem, there are no commonly used ap-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 156.21299999999997, "r_x1": 286.365, "r_y1": 156.21299999999997, "r_x2": 286.365, "r_y2": 147.66099999999994, "r_x3": 50.112, "r_y3": 147.66099999999994, "coord_origin": "TOPLEFT"}, "text": "proaches that can easily be re-purposed to solve this prob-", "orig": "proaches that can easily be re-purposed to solve this prob-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 168.168, "r_x1": 286.365, "r_y1": 168.168, "r_x2": 286.365, "r_y2": 159.61599999999999, "r_x3": 50.112, "r_y3": 159.61599999999999, "coord_origin": "TOPLEFT"}, "text": "lem. Lately, a set of new model-architectures has been pro-", "orig": "lem. Lately, a set of new model-architectures has been pro-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 180.12300000000005, "r_x1": 286.365, "r_y1": 180.12300000000005, "r_x2": 286.365, "r_y2": 171.57100000000003, "r_x3": 50.112, "r_y3": 171.57100000000003, "coord_origin": "TOPLEFT"}, "text": "posed by the community to address table-structure decom-", "orig": "posed by the community to address table-structure decom-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 192.07799999999997, "r_x1": 286.365, "r_y1": 192.07799999999997, "r_x2": 286.365, "r_y2": 183.52599999999995, "r_x3": 50.112, "r_y3": 183.52599999999995, "coord_origin": "TOPLEFT"}, "text": "position [37, 36, 18, 20]. All these models have some weak-", "orig": "position [37, 36, 18, 20]. All these models have some weak-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 204.03300000000002, "r_x1": 114.51, "r_y1": 204.03300000000002, "r_x2": 114.51, "r_y2": 195.481, "r_x3": 50.112, "r_y3": 195.481, "coord_origin": "TOPLEFT"}, "text": "nesses (see Sec.", "orig": "nesses (see Sec.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 119.163, "r_y0": 204.03300000000002, "r_x1": 129.952, "r_y1": 204.03300000000002, "r_x2": 129.952, "r_y2": 195.481, "r_x3": 119.163, "r_y3": 195.481, "coord_origin": "TOPLEFT"}, "text": "2).", "orig": "2).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.615, "r_y0": 204.03300000000002, "r_x1": 286.365, "r_y1": 204.03300000000002, "r_x2": 286.365, "r_y2": 195.481, "r_x3": 134.615, "r_y3": 195.481, "coord_origin": "TOPLEFT"}, "text": "The common denominator here is the", "orig": "The common denominator here is the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 215.98800000000006, "r_x1": 286.365, "r_y1": 215.98800000000006, "r_x2": 286.365, "r_y2": 207.43600000000004, "r_x3": 50.112, "r_y3": 207.43600000000004, "coord_origin": "TOPLEFT"}, "text": "reliance on textual features and/or the inability to provide", "orig": "reliance on textual features and/or the inability to provide", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 227.94399999999996, "r_x1": 278.664, "r_y1": 227.94399999999996, "r_x2": 278.664, "r_y2": 219.39200000000005, "r_x3": 50.112, "r_y3": 219.39200000000005, "coord_origin": "TOPLEFT"}, "text": "the bounding box of each table-cell in the original image.", "orig": "the bounding box of each table-cell in the original image.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "The second problem is called table-structure decomposition. The latter is a long standing problem in the community of document understanding [6, 4, 14]. Contrary to the table-location problem, there are no commonly used approaches that can easily be re-purposed to solve this problem. Lately, a set of new model-architectures has been proposed by the community to address table-structure decomposition [37, 36, 18, 20]. All these models have some weaknesses (see Sec. 2). The common denominator here is the reliance on textual features and/or the inability to provide the bounding box of each table-cell in the original image."}, {"label": "text", "id": 2, "page_no": 1, "cluster": {"id": 2, "label": "text", "bbox": {"l": 50.112, "t": 231.79999999999995, "r": 286.365, "b": 371.859, "coord_origin": "TOPLEFT"}, "confidence": 0.9855920076370239, "cells": [{"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 240.35199999999998, "r_x1": 286.365, "r_y1": 240.35199999999998, "r_x2": 286.365, "r_y2": 231.79999999999995, "r_x3": 62.067, "r_y3": 231.79999999999995, "coord_origin": "TOPLEFT"}, "text": "In this paper, we want to address these weaknesses and", "orig": "In this paper, we want to address these weaknesses and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 252.30700000000002, "r_x1": 78.884, "r_y1": 252.30700000000002, "r_x2": 78.884, "r_y2": 243.755, "r_x3": 50.112, "r_y3": 243.755, "coord_origin": "TOPLEFT"}, "text": "present", "orig": "present", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 19, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 83.068, "r_y0": 252.30700000000002, "r_x1": 116.373, "r_y1": 252.30700000000002, "r_x2": 116.373, "r_y2": 243.755, "r_x3": 83.068, "r_y3": 243.755, "coord_origin": "TOPLEFT"}, "text": "a robust", "orig": "a robust", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 20, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 120.558, "r_y0": 252.30700000000002, "r_x1": 178.102, "r_y1": 252.30700000000002, "r_x2": 178.102, "r_y2": 243.755, "r_x3": 120.558, "r_y3": 243.755, "coord_origin": "TOPLEFT"}, "text": "table-structure", "orig": "table-structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 21, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 182.276, "r_y0": 252.30700000000002, "r_x1": 286.365, "r_y1": 252.30700000000002, "r_x2": 286.365, "r_y2": 243.755, "r_x3": 182.276, "r_y3": 243.755, "coord_origin": "TOPLEFT"}, "text": "decomposition algorithm.", "orig": "decomposition algorithm.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 22, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 264.26199999999994, "r_x1": 260.432, "r_y1": 264.26199999999994, "r_x2": 260.432, "r_y2": 255.71000000000004, "r_x3": 50.112, "r_y3": 255.71000000000004, "coord_origin": "TOPLEFT"}, "text": "The design criteria for our model are the following.", "orig": "The design criteria for our model are the following.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 23, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 265.603, "r_y0": 264.26199999999994, "r_x1": 286.365, "r_y1": 264.26199999999994, "r_x2": 286.365, "r_y2": 255.71000000000004, "r_x3": 265.603, "r_y3": 255.71000000000004, "coord_origin": "TOPLEFT"}, "text": "First,", "orig": "First,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 24, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 276.217, "r_x1": 286.365, "r_y1": 276.217, "r_x2": 286.365, "r_y2": 267.66499999999996, "r_x3": 50.112, "r_y3": 267.66499999999996, "coord_origin": "TOPLEFT"}, "text": "we want our algorithm to be language agnostic. In this way,", "orig": "we want our algorithm to be language agnostic. In this way,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 25, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 288.172, "r_x1": 286.365, "r_y1": 288.172, "r_x2": 286.365, "r_y2": 279.62, "r_x3": 50.112, "r_y3": 279.62, "coord_origin": "TOPLEFT"}, "text": "we can obtain the structure of any table, irregardless of the", "orig": "we can obtain the structure of any table, irregardless of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 26, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 300.128, "r_x1": 88.568, "r_y1": 300.128, "r_x2": 88.568, "r_y2": 291.576, "r_x3": 50.112, "r_y3": 291.576, "coord_origin": "TOPLEFT"}, "text": "language.", "orig": "language.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 27, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 95.502, "r_y0": 300.128, "r_x1": 286.365, "r_y1": 300.128, "r_x2": 286.365, "r_y2": 291.576, "r_x3": 95.502, "r_y3": 291.576, "coord_origin": "TOPLEFT"}, "text": "Second, we want our algorithm to leverage as", "orig": "Second, we want our algorithm to leverage as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 28, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 312.083, "r_x1": 286.365, "r_y1": 312.083, "r_x2": 286.365, "r_y2": 303.531, "r_x3": 50.112, "r_y3": 303.531, "coord_origin": "TOPLEFT"}, "text": "much data as possible from the original PDF document. For", "orig": "much data as possible from the original PDF document. For", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 29, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 324.038, "r_x1": 286.365, "r_y1": 324.038, "r_x2": 286.365, "r_y2": 315.486, "r_x3": 50.112, "r_y3": 315.486, "coord_origin": "TOPLEFT"}, "text": "programmatic PDF documents, the text-cells can often be", "orig": "programmatic PDF documents, the text-cells can often be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 30, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 335.993, "r_x1": 286.365, "r_y1": 335.993, "r_x2": 286.365, "r_y2": 327.441, "r_x3": 50.112, "r_y3": 327.441, "coord_origin": "TOPLEFT"}, "text": "extracted much faster and with higher accuracy compared", "orig": "extracted much faster and with higher accuracy compared", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 347.948, "r_x1": 286.365, "r_y1": 347.948, "r_x2": 286.365, "r_y2": 339.396, "r_x3": 50.112, "r_y3": 339.396, "coord_origin": "TOPLEFT"}, "text": "to OCR methods. Last but not least, we want to have a di-", "orig": "to OCR methods. Last but not least, we want to have a di-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 359.904, "r_x1": 286.365, "r_y1": 359.904, "r_x2": 286.365, "r_y2": 351.352, "r_x3": 50.112, "r_y3": 351.352, "coord_origin": "TOPLEFT"}, "text": "rect link between the table-cell and its bounding box in the", "orig": "rect link between the table-cell and its bounding box in the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 371.859, "r_x1": 76.951, "r_y1": 371.859, "r_x2": 76.951, "r_y2": 363.307, "r_x3": 50.112, "r_y3": 363.307, "coord_origin": "TOPLEFT"}, "text": "image.", "orig": "image.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "In this paper, we want to address these weaknesses and present a robust table-structure decomposition algorithm. The design criteria for our model are the following. First, we want our algorithm to be language agnostic. In this way, we can obtain the structure of any table, irregardless of the language. Second, we want our algorithm to leverage as much data as possible from the original PDF document. For programmatic PDF documents, the text-cells can often be extracted much faster and with higher accuracy compared to OCR methods. Last but not least, we want to have a direct link between the table-cell and its bounding box in the image."}, {"label": "text", "id": 7, "page_no": 1, "cluster": {"id": 7, "label": "text", "bbox": {"l": 50.112, "t": 375.715, "r": 286.367, "b": 432.087, "coord_origin": "TOPLEFT"}, "confidence": 0.9820111393928528, "cells": [{"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 384.267, "r_x1": 286.365, "r_y1": 384.267, "r_x2": 286.365, "r_y2": 375.715, "r_x3": 62.067, "r_y3": 375.715, "coord_origin": "TOPLEFT"}, "text": "To meet the design criteria listed above, we developed a", "orig": "To meet the design criteria listed above, we developed a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 396.222, "r_x1": 120.986, "r_y1": 396.222, "r_x2": 120.986, "r_y2": 387.67, "r_x3": 50.112, "r_y3": 387.67, "coord_origin": "TOPLEFT"}, "text": "new model called", "orig": "new model called", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 123.901, "r_y0": 396.238, "r_x1": 179.731, "r_y1": 396.238, "r_x2": 179.731, "r_y2": 387.282, "r_x3": 123.901, "r_y3": 387.282, "coord_origin": "TOPLEFT"}, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 182.646, "r_y0": 396.222, "r_x1": 286.367, "r_y1": 396.222, "r_x2": 286.367, "r_y2": 387.67, "r_x3": 182.646, "r_y3": 387.67, "coord_origin": "TOPLEFT"}, "text": "and a synthetically gener-", "orig": "and a synthetically gener-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 408.177, "r_x1": 181.758, "r_y1": 408.177, "r_x2": 181.758, "r_y2": 399.625, "r_x3": 50.112, "r_y3": 399.625, "coord_origin": "TOPLEFT"}, "text": "ated table structure dataset called", "orig": "ated table structure dataset called", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 184.104, "r_y0": 408.193, "r_x1": 240.203, "r_y1": 408.193, "r_x2": 240.203, "r_y2": 399.237, "r_x3": 184.104, "r_y3": 399.237, "coord_origin": "TOPLEFT"}, "text": "SynthTabNet", "orig": "SynthTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 240.204, "r_y0": 403.942, "r_x1": 243.691, "r_y1": 403.942, "r_x2": 243.691, "r_y2": 397.956, "r_x3": 240.204, "r_y3": 397.956, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 244.189, "r_y0": 408.177, "r_x1": 246.68, "r_y1": 408.177, "r_x2": 246.68, "r_y2": 399.625, "r_x3": 244.189, "r_y3": 399.625, "coord_origin": "TOPLEFT"}, "text": ".", "orig": ".", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 249.718, "r_y0": 408.177, "r_x1": 286.361, "r_y1": 408.177, "r_x2": 286.361, "r_y2": 399.625, "r_x3": 249.718, "r_y3": 399.625, "coord_origin": "TOPLEFT"}, "text": "In partic-", "orig": "In partic-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 420.132, "r_x1": 67.696, "r_y1": 420.132, "r_x2": 67.696, "r_y2": 411.58, "r_x3": 50.112, "r_y3": 411.58, "coord_origin": "TOPLEFT"}, "text": "ular,", "orig": "ular,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 71.322, "r_y0": 420.132, "r_x1": 286.365, "r_y1": 420.132, "r_x2": 286.365, "r_y2": 411.58, "r_x3": 71.322, "r_y3": 411.58, "coord_origin": "TOPLEFT"}, "text": "our contributions in this work can be summarised as", "orig": "our contributions in this work can be summarised as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 432.087, "r_x1": 82.52, "r_y1": 432.087, "r_x2": 82.52, "r_y2": 423.535, "r_x3": 50.112, "r_y3": 423.535, "coord_origin": "TOPLEFT"}, "text": "follows:", "orig": "follows:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "To meet the design criteria listed above, we developed a new model called TableFormer and a synthetically generated table structure dataset called SynthTabNet 1 . In particular, our contributions in this work can be summarised as follows:"}, {"label": "list_item", "id": 6, "page_no": 1, "cluster": {"id": 6, "label": "list_item", "bbox": {"l": 61.569, "t": 444.432, "r": 286.365, "b": 489.237, "coord_origin": "TOPLEFT"}, "confidence": 0.9822162389755249, "cells": [{"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 61.569, "r_y0": 453.372, "r_x1": 65.056, "r_y1": 453.372, "r_x2": 65.056, "r_y2": 444.82, "r_x3": 61.569, "r_y3": 444.82, "coord_origin": "TOPLEFT"}, "text": "\u2022", "orig": "\u2022", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.037, "r_y0": 453.372, "r_x1": 117.101, "r_y1": 453.372, "r_x2": 117.101, "r_y2": 444.82, "r_x3": 70.037, "r_y3": 444.82, "coord_origin": "TOPLEFT"}, "text": "We propose", "orig": "We propose", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 48, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 119.59, "r_y0": 453.388, "r_x1": 175.42, "r_y1": 453.388, "r_x2": 175.42, "r_y2": 444.432, "r_x3": 119.59, "r_y3": 444.432, "coord_origin": "TOPLEFT"}, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 49, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 175.421, "r_y0": 453.372, "r_x1": 286.365, "r_y1": 453.372, "r_x2": 286.365, "r_y2": 444.82, "r_x3": 175.421, "r_y3": 444.82, "coord_origin": "TOPLEFT"}, "text": ", a transformer based model", "orig": ", a transformer based model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 50, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.037, "r_y0": 465.327, "r_x1": 286.365, "r_y1": 465.327, "r_x2": 286.365, "r_y2": 456.775, "r_x3": 70.037, "r_y3": 456.775, "coord_origin": "TOPLEFT"}, "text": "that predicts tables structure and bounding boxes for", "orig": "that predicts tables structure and bounding boxes for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 51, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.037, "r_y0": 477.282, "r_x1": 286.365, "r_y1": 477.282, "r_x2": 286.365, "r_y2": 468.73, "r_x3": 70.037, "r_y3": 468.73, "coord_origin": "TOPLEFT"}, "text": "the table content simultaneously in an end-to-end ap-", "orig": "the table content simultaneously in an end-to-end ap-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 52, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.037, "r_y0": 489.237, "r_x1": 99.636, "r_y1": 489.237, "r_x2": 99.636, "r_y2": 480.685, "r_x3": 70.037, "r_y3": 480.685, "coord_origin": "TOPLEFT"}, "text": "proach.", "orig": "proach.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "\u00b7 We propose TableFormer , a transformer based model that predicts tables structure and bounding boxes for the table content simultaneously in an end-to-end approach."}, {"label": "list_item", "id": 5, "page_no": 1, "cluster": {"id": 5, "label": "list_item", "bbox": {"l": 61.569, "t": 502.034, "r": 286.365, "b": 546.84, "coord_origin": "TOPLEFT"}, "confidence": 0.982271671295166, "cells": [{"index": 53, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 61.569, "r_y0": 510.974, "r_x1": 65.056, "r_y1": 510.974, "r_x2": 65.056, "r_y2": 502.422, "r_x3": 61.569, "r_y3": 502.422, "coord_origin": "TOPLEFT"}, "text": "\u2022", "orig": "\u2022", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 54, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.037, "r_y0": 510.974, "r_x1": 111.88, "r_y1": 510.974, "r_x2": 111.88, "r_y2": 502.422, "r_x3": 70.037, "r_y3": 502.422, "coord_origin": "TOPLEFT"}, "text": "Across all", "orig": "Across all", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 55, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 116.084, "r_y0": 510.974, "r_x1": 196.104, "r_y1": 510.974, "r_x2": 196.104, "r_y2": 502.422, "r_x3": 116.084, "r_y3": 502.422, "coord_origin": "TOPLEFT"}, "text": "benchmark datasets", "orig": "benchmark datasets", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 56, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 200.31, "r_y0": 510.99, "r_x1": 256.14, "r_y1": 510.99, "r_x2": 256.14, "r_y2": 502.034, "r_x3": 200.31, "r_y3": 502.034, "coord_origin": "TOPLEFT"}, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 57, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 260.35, "r_y0": 510.974, "r_x1": 286.362, "r_y1": 510.974, "r_x2": 286.362, "r_y2": 502.422, "r_x3": 260.35, "r_y3": 502.422, "coord_origin": "TOPLEFT"}, "text": "signif-", "orig": "signif-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 58, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.037, "r_y0": 522.929, "r_x1": 97.155, "r_y1": 522.929, "r_x2": 97.155, "r_y2": 514.377, "r_x3": 70.037, "r_y3": 514.377, "coord_origin": "TOPLEFT"}, "text": "icantly", "orig": "icantly", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 59, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 101.678, "r_y0": 522.929, "r_x1": 150.375, "r_y1": 522.929, "r_x2": 150.375, "r_y2": 514.377, "r_x3": 101.678, "r_y3": 514.377, "coord_origin": "TOPLEFT"}, "text": "outperforms", "orig": "outperforms", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 60, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 154.898, "r_y0": 522.929, "r_x1": 186.301, "r_y1": 522.929, "r_x2": 186.301, "r_y2": 514.377, "r_x3": 154.898, "r_y3": 514.377, "coord_origin": "TOPLEFT"}, "text": "existing", "orig": "existing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 61, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 190.824, "r_y0": 522.929, "r_x1": 250.021, "r_y1": 522.929, "r_x2": 250.021, "r_y2": 514.377, "r_x3": 190.824, "r_y3": 514.377, "coord_origin": "TOPLEFT"}, "text": "state-of-the-art", "orig": "state-of-the-art", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 62, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 254.544, "r_y0": 522.929, "r_x1": 286.365, "r_y1": 522.929, "r_x2": 286.365, "r_y2": 514.377, "r_x3": 254.544, "r_y3": 514.377, "coord_origin": "TOPLEFT"}, "text": "metrics,", "orig": "metrics,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 63, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.037, "r_y0": 534.885, "r_x1": 286.365, "r_y1": 534.885, "r_x2": 286.365, "r_y2": 526.3330000000001, "r_x3": 70.037, "r_y3": 526.3330000000001, "coord_origin": "TOPLEFT"}, "text": "while being much more efficient in training and infer-", "orig": "while being much more efficient in training and infer-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 64, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.037, "r_y0": 546.84, "r_x1": 161.653, "r_y1": 546.84, "r_x2": 161.653, "r_y2": 538.288, "r_x3": 70.037, "r_y3": 538.288, "coord_origin": "TOPLEFT"}, "text": "ence to existing works.", "orig": "ence to existing works.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "\u00b7 Across all benchmark datasets TableFormer significantly outperforms existing state-of-the-art metrics, while being much more efficient in training and inference to existing works."}, {"label": "list_item", "id": 9, "page_no": 1, "cluster": {"id": 9, "label": "list_item", "bbox": {"l": 61.569, "t": 559.637, "r": 286.365, "b": 592.487, "coord_origin": "TOPLEFT"}, "confidence": 0.9802963733673096, "cells": [{"index": 65, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 61.569, "r_y0": 568.577, "r_x1": 65.056, "r_y1": 568.577, "r_x2": 65.056, "r_y2": 560.025, "r_x3": 61.569, "r_y3": 560.025, "coord_origin": "TOPLEFT"}, "text": "\u2022", "orig": "\u2022", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 66, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.037, "r_y0": 568.577, "r_x1": 116.712, "r_y1": 568.577, "r_x2": 116.712, "r_y2": 560.025, "r_x3": 70.037, "r_y3": 560.025, "coord_origin": "TOPLEFT"}, "text": "We present", "orig": "We present", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 67, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 121.583, "r_y0": 568.593, "r_x1": 177.682, "r_y1": 568.593, "r_x2": 177.682, "r_y2": 559.637, "r_x3": 121.583, "r_y3": 559.637, "coord_origin": "TOPLEFT"}, "text": "SynthTabNet", "orig": "SynthTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 68, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 182.553, "r_y0": 568.577, "r_x1": 186.976, "r_y1": 568.577, "r_x2": 186.976, "r_y2": 560.025, "r_x3": 182.553, "r_y3": 560.025, "coord_origin": "TOPLEFT"}, "text": "a", "orig": "a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 69, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 191.848, "r_y0": 568.577, "r_x1": 242.767, "r_y1": 568.577, "r_x2": 242.767, "r_y2": 560.025, "r_x3": 191.848, "r_y3": 560.025, "coord_origin": "TOPLEFT"}, "text": "synthetically", "orig": "synthetically", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 70, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 247.639, "r_y0": 568.577, "r_x1": 286.363, "r_y1": 568.577, "r_x2": 286.363, "r_y2": 560.025, "r_x3": 247.639, "r_y3": 560.025, "coord_origin": "TOPLEFT"}, "text": "generated", "orig": "generated", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 71, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.037, "r_y0": 580.532, "r_x1": 286.365, "r_y1": 580.532, "r_x2": 286.365, "r_y2": 571.98, "r_x3": 70.037, "r_y3": 571.98, "coord_origin": "TOPLEFT"}, "text": "dataset, with various appearance styles and complex-", "orig": "dataset, with various appearance styles and complex-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 72, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.037, "r_y0": 592.487, "r_x1": 82.401, "r_y1": 592.487, "r_x2": 82.401, "r_y2": 583.935, "r_x3": 70.037, "r_y3": 583.935, "coord_origin": "TOPLEFT"}, "text": "ity.", "orig": "ity.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "\u00b7 We present SynthTabNet a synthetically generated dataset, with various appearance styles and complexity."}, {"label": "list_item", "id": 8, "page_no": 1, "cluster": {"id": 8, "label": "list_item", "bbox": {"l": 61.569, "t": 605.672, "r": 286.365, "b": 638.135, "coord_origin": "TOPLEFT"}, "confidence": 0.9806395173072815, "cells": [{"index": 73, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 61.569, "r_y0": 614.2239999999999, "r_x1": 65.056, "r_y1": 614.2239999999999, "r_x2": 65.056, "r_y2": 605.672, "r_x3": 61.569, "r_y3": 605.672, "coord_origin": "TOPLEFT"}, "text": "\u2022", "orig": "\u2022", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 74, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.037, "r_y0": 614.2239999999999, "r_x1": 132.005, "r_y1": 614.2239999999999, "r_x2": 132.005, "r_y2": 605.672, "r_x3": 70.037, "r_y3": 605.672, "coord_origin": "TOPLEFT"}, "text": "An augmented", "orig": "An augmented", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 75, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 138.082, "r_y0": 614.2239999999999, "r_x1": 165.748, "r_y1": 614.2239999999999, "r_x2": 165.748, "r_y2": 605.672, "r_x3": 138.082, "r_y3": 605.672, "coord_origin": "TOPLEFT"}, "text": "dataset", "orig": "dataset", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 76, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 171.815, "r_y0": 614.2239999999999, "r_x1": 194.5, "r_y1": 614.2239999999999, "r_x2": 194.5, "r_y2": 605.672, "r_x3": 171.815, "r_y3": 605.672, "coord_origin": "TOPLEFT"}, "text": "based", "orig": "based", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 77, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 200.577, "r_y0": 614.2239999999999, "r_x1": 210.54, "r_y1": 614.2239999999999, "r_x2": 210.54, "r_y2": 605.672, "r_x3": 200.577, "r_y3": 605.672, "coord_origin": "TOPLEFT"}, "text": "on", "orig": "on", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 78, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 216.617, "r_y0": 614.2239999999999, "r_x1": 261.2, "r_y1": 614.2239999999999, "r_x2": 261.2, "r_y2": 605.672, "r_x3": 216.617, "r_y3": 605.672, "coord_origin": "TOPLEFT"}, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 79, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 267.277, "r_y0": 614.2239999999999, "r_x1": 286.365, "r_y1": 614.2239999999999, "r_x2": 286.365, "r_y2": 605.672, "r_x3": 267.277, "r_y3": 605.672, "coord_origin": "TOPLEFT"}, "text": "[37],", "orig": "[37],", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 80, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.037, "r_y0": 626.179, "r_x1": 135.521, "r_y1": 626.179, "r_x2": 135.521, "r_y2": 617.627, "r_x3": 70.037, "r_y3": 617.627, "coord_origin": "TOPLEFT"}, "text": "FinTabNet [36],", "orig": "FinTabNet [36],", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 81, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 139.925, "r_y0": 626.179, "r_x1": 286.365, "r_y1": 626.179, "r_x2": 286.365, "r_y2": 617.627, "r_x3": 139.925, "r_y3": 617.627, "coord_origin": "TOPLEFT"}, "text": "and TableBank [17] with generated", "orig": "and TableBank [17] with generated", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 82, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.037, "r_y0": 638.135, "r_x1": 198.056, "r_y1": 638.135, "r_x2": 198.056, "r_y2": 629.583, "r_x3": 70.037, "r_y3": 629.583, "coord_origin": "TOPLEFT"}, "text": "ground-truth for reproducibility.", "orig": "ground-truth for reproducibility.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "\u00b7 An augmented dataset based on PubTabNet [37], FinTabNet [36], and TableBank [17] with generated ground-truth for reproducibility."}, {"label": "text", "id": 11, "page_no": 1, "cluster": {"id": 11, "label": "text", "bbox": {"l": 50.112, "t": 650.867, "r": 286.365, "b": 695.284, "coord_origin": "TOPLEFT"}, "confidence": 0.9742533564567566, "cells": [{"index": 83, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 659.419, "r_x1": 204.452, "r_y1": 659.419, "r_x2": 204.452, "r_y2": 650.867, "r_x3": 62.067, "r_y3": 650.867, "coord_origin": "TOPLEFT"}, "text": "The paper is structured as follows.", "orig": "The paper is structured as follows.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 84, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 210.789, "r_y0": 659.419, "r_x1": 286.365, "r_y1": 659.419, "r_x2": 286.365, "r_y2": 650.867, "r_x3": 210.789, "r_y3": 650.867, "coord_origin": "TOPLEFT"}, "text": "In Sec. 2, we give", "orig": "In Sec. 2, we give", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 85, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 671.374, "r_x1": 240.896, "r_y1": 671.374, "r_x2": 240.896, "r_y2": 662.822, "r_x3": 50.112, "r_y3": 662.822, "coord_origin": "TOPLEFT"}, "text": "a brief overview of the current state-of-the-art.", "orig": "a brief overview of the current state-of-the-art.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 86, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 246.833, "r_y0": 671.374, "r_x1": 286.365, "r_y1": 671.374, "r_x2": 286.365, "r_y2": 662.822, "r_x3": 246.833, "r_y3": 662.822, "coord_origin": "TOPLEFT"}, "text": "In Sec. 3,", "orig": "In Sec. 3,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 87, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 683.329, "r_x1": 227.396, "r_y1": 683.329, "r_x2": 227.396, "r_y2": 674.777, "r_x3": 50.112, "r_y3": 674.777, "coord_origin": "TOPLEFT"}, "text": "we describe the datasets on which we train.", "orig": "we describe the datasets on which we train.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 88, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 232.467, "r_y0": 683.329, "r_x1": 286.365, "r_y1": 683.329, "r_x2": 286.365, "r_y2": 674.777, "r_x3": 232.467, "r_y3": 674.777, "coord_origin": "TOPLEFT"}, "text": "In Sec. 4, we", "orig": "In Sec. 4, we", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 89, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 695.284, "r_x1": 286.365, "r_y1": 695.284, "r_x2": 286.365, "r_y2": 686.732, "r_x3": 50.112, "r_y3": 686.732, "coord_origin": "TOPLEFT"}, "text": "introduce the TableFormer model-architecture and describe", "orig": "introduce the TableFormer model-architecture and describe", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "The paper is structured as follows. In Sec. 2, we give a brief overview of the current state-of-the-art. In Sec. 3, we describe the datasets on which we train. In Sec. 4, we introduce the TableFormer model-architecture and describe"}, {"label": "footnote", "id": 14, "page_no": 1, "cluster": {"id": 14, "label": "footnote", "bbox": {"l": 60.971, "t": 704.296, "r": 183.731, "b": 712.653, "coord_origin": "TOPLEFT"}, "confidence": 0.895367443561554, "cells": [{"index": 90, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 60.971, "r_y0": 709.427, "r_x1": 63.96, "r_y1": 709.427, "r_x2": 63.96, "r_y2": 704.296, "r_x3": 60.971, "r_y3": 704.296, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 91, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 64.458, "r_y0": 712.653, "r_x1": 183.731, "r_y1": 712.653, "r_x2": 183.731, "r_y2": 705.811, "r_x3": 64.458, "r_y3": 705.811, "coord_origin": "TOPLEFT"}, "text": "https://github.com/IBM/SynthTabNet", "orig": "https://github.com/IBM/SynthTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "1 https://github.com/IBM/SynthTabNet"}, {"label": "text", "id": 10, "page_no": 1, "cluster": {"id": 10, "label": "text", "bbox": {"l": 308.862, "t": 75.47699999999998, "r": 545.115, "b": 107.93899999999996, "coord_origin": "TOPLEFT"}, "confidence": 0.9774322509765625, "cells": [{"index": 92, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 84.029, "r_x1": 545.115, "r_y1": 84.029, "r_x2": 545.115, "r_y2": 75.47699999999998, "r_x3": 308.862, "r_y3": 75.47699999999998, "coord_origin": "TOPLEFT"}, "text": "its results &performance in Sec. 5. As a conclusion, we de-", "orig": "its results &performance in Sec. 5. As a conclusion, we de-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 93, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 95.98400000000004, "r_x1": 545.115, "r_y1": 95.98400000000004, "r_x2": 545.115, "r_y2": 87.43200000000002, "r_x3": 308.862, "r_y3": 87.43200000000002, "coord_origin": "TOPLEFT"}, "text": "scribe how this new model-architecture can be re-purposed", "orig": "scribe how this new model-architecture can be re-purposed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 94, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 107.93899999999996, "r_x1": 508.084, "r_y1": 107.93899999999996, "r_x2": 508.084, "r_y2": 99.38699999999994, "r_x3": 308.862, "r_y3": 99.38699999999994, "coord_origin": "TOPLEFT"}, "text": "for other tasks in the computer-vision community.", "orig": "for other tasks in the computer-vision community.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "its results &performance in Sec. 5. As a conclusion, we describe how this new model-architecture can be re-purposed for other tasks in the computer-vision community."}, {"label": "section_header", "id": 13, "page_no": 1, "cluster": {"id": 13, "label": "section_header", "bbox": {"l": 308.862, "t": 121.73199999999997, "r": 498.28, "b": 132.48000000000002, "coord_origin": "TOPLEFT"}, "confidence": 0.9428724646568298, "cells": [{"index": 95, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 132.48000000000002, "r_x1": 498.28, "r_y1": 132.48000000000002, "r_x2": 498.28, "r_y2": 121.73199999999997, "r_x3": 308.862, "r_y3": 121.73199999999997, "coord_origin": "TOPLEFT"}, "text": "2. Previous work and State of the Art", "orig": "2. Previous work and State of the Art", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "2. Previous work and State of the Art"}, {"label": "text", "id": 0, "page_no": 1, "cluster": {"id": 0, "label": "text", "bbox": {"l": 308.862, "t": 142.49, "r": 545.115, "b": 330.369, "coord_origin": "TOPLEFT"}, "confidence": 0.987194836139679, "cells": [{"index": 96, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 151.04200000000003, "r_x1": 545.115, "r_y1": 151.04200000000003, "r_x2": 545.115, "r_y2": 142.49, "r_x3": 320.817, "r_y3": 142.49, "coord_origin": "TOPLEFT"}, "text": "Identifying the structure of a table has been an outstand-", "orig": "Identifying the structure of a table has been an outstand-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 97, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 162.99699999999996, "r_x1": 545.115, "r_y1": 162.99699999999996, "r_x2": 545.115, "r_y2": 154.44500000000005, "r_x3": 308.862, "r_y3": 154.44500000000005, "coord_origin": "TOPLEFT"}, "text": "ing problem in the document-parsing community, that mo-", "orig": "ing problem in the document-parsing community, that mo-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 98, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 174.952, "r_x1": 334.376, "r_y1": 174.952, "r_x2": 334.376, "r_y2": 166.39999999999998, "r_x3": 308.862, "r_y3": 166.39999999999998, "coord_origin": "TOPLEFT"}, "text": "tivates", "orig": "tivates", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 99, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 338.192, "r_y0": 174.952, "r_x1": 522.56, "r_y1": 174.952, "r_x2": 522.56, "r_y2": 166.39999999999998, "r_x3": 338.192, "r_y3": 166.39999999999998, "coord_origin": "TOPLEFT"}, "text": "many organised public challenges [6, 4, 14].", "orig": "many organised public challenges [6, 4, 14].", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 100, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 529.623, "r_y0": 174.952, "r_x1": 545.115, "r_y1": 174.952, "r_x2": 545.115, "r_y2": 166.39999999999998, "r_x3": 529.623, "r_y3": 166.39999999999998, "coord_origin": "TOPLEFT"}, "text": "The", "orig": "The", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 101, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 186.90700000000004, "r_x1": 545.115, "r_y1": 186.90700000000004, "r_x2": 545.115, "r_y2": 178.35500000000002, "r_x3": 308.862, "r_y3": 178.35500000000002, "coord_origin": "TOPLEFT"}, "text": "difficulty of the problem can be attributed to a number of", "orig": "difficulty of the problem can be attributed to a number of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 102, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 198.86199999999997, "r_x1": 545.115, "r_y1": 198.86199999999997, "r_x2": 545.115, "r_y2": 190.30999999999995, "r_x3": 308.862, "r_y3": 190.30999999999995, "coord_origin": "TOPLEFT"}, "text": "factors. First, there is a large variety in the shapes and sizes", "orig": "factors. First, there is a large variety in the shapes and sizes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 103, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 210.817, "r_x1": 346.979, "r_y1": 210.817, "r_x2": 346.979, "r_y2": 202.265, "r_x3": 308.862, "r_y3": 202.265, "coord_origin": "TOPLEFT"}, "text": "of tables.", "orig": "of tables.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 104, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 354.869, "r_y0": 210.817, "r_x1": 508.642, "r_y1": 210.817, "r_x2": 508.642, "r_y2": 202.265, "r_x3": 354.869, "r_y3": 202.265, "coord_origin": "TOPLEFT"}, "text": "Such large variety requires a flexible", "orig": "Such large variety requires a flexible", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 105, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 512.737, "r_y0": 210.817, "r_x1": 545.115, "r_y1": 210.817, "r_x2": 545.115, "r_y2": 202.265, "r_x3": 512.737, "r_y3": 202.265, "coord_origin": "TOPLEFT"}, "text": "method.", "orig": "method.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 106, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 222.77300000000002, "r_x1": 545.115, "r_y1": 222.77300000000002, "r_x2": 545.115, "r_y2": 214.221, "r_x3": 308.862, "r_y3": 214.221, "coord_origin": "TOPLEFT"}, "text": "This is especially true for complex column- and row head-", "orig": "This is especially true for complex column- and row head-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 107, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 234.72799999999995, "r_x1": 322.969, "r_y1": 234.72799999999995, "r_x2": 322.969, "r_y2": 226.17600000000004, "r_x3": 308.862, "r_y3": 226.17600000000004, "coord_origin": "TOPLEFT"}, "text": "ers,", "orig": "ers,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 108, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 327.084, "r_y0": 234.72799999999995, "r_x1": 530.918, "r_y1": 234.72799999999995, "r_x2": 530.918, "r_y2": 226.17600000000004, "r_x3": 327.084, "r_y3": 226.17600000000004, "coord_origin": "TOPLEFT"}, "text": "which can be extremely intricate and demanding.", "orig": "which can be extremely intricate and demanding.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 109, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 537.922, "r_y0": 234.72799999999995, "r_x1": 545.115, "r_y1": 234.72799999999995, "r_x2": 545.115, "r_y2": 226.17600000000004, "r_x3": 537.922, "r_y3": 226.17600000000004, "coord_origin": "TOPLEFT"}, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 110, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 246.683, "r_x1": 545.115, "r_y1": 246.683, "r_x2": 545.115, "r_y2": 238.13099999999997, "r_x3": 308.862, "r_y3": 238.13099999999997, "coord_origin": "TOPLEFT"}, "text": "second factor of complexity is the lack of data with regard", "orig": "second factor of complexity is the lack of data with regard", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 111, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 258.63800000000003, "r_x1": 545.115, "r_y1": 258.63800000000003, "r_x2": 545.115, "r_y2": 250.086, "r_x3": 308.862, "r_y3": 250.086, "coord_origin": "TOPLEFT"}, "text": "to table-structure. Until the publication of PubTabNet [37],", "orig": "to table-structure. Until the publication of PubTabNet [37],", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 112, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 270.59299999999996, "r_x1": 439.84, "r_y1": 270.59299999999996, "r_x2": 439.84, "r_y2": 262.04100000000005, "r_x3": 308.862, "r_y3": 262.04100000000005, "coord_origin": "TOPLEFT"}, "text": "there were no large datasets (i.e.", "orig": "there were no large datasets (i.e.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 113, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 444.44, "r_y0": 270.429, "r_x1": 452.189, "r_y1": 270.429, "r_x2": 452.189, "r_y2": 261.72299999999996, "r_x3": 444.44, "r_y3": 261.72299999999996, "coord_origin": "TOPLEFT"}, "text": ">", "orig": ">", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 114, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 455.89, "r_y0": 270.429, "r_x1": 470.834, "r_y1": 270.429, "r_x2": 470.834, "r_y2": 261.72299999999996, "r_x3": 455.89, "r_y3": 261.72299999999996, "coord_origin": "TOPLEFT"}, "text": "100", "orig": "100", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 115, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 470.834, "r_y0": 270.59299999999996, "r_x1": 545.115, "r_y1": 270.59299999999996, "r_x2": 545.115, "r_y2": 262.04100000000005, "r_x3": 470.834, "r_y3": 262.04100000000005, "coord_origin": "TOPLEFT"}, "text": "K tables) that pro-", "orig": "K tables) that pro-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 116, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 282.548, "r_x1": 545.115, "r_y1": 282.548, "r_x2": 545.115, "r_y2": 273.996, "r_x3": 308.862, "r_y3": 273.996, "coord_origin": "TOPLEFT"}, "text": "vided structure information. This happens primarily due to", "orig": "vided structure information. This happens primarily due to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 117, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 294.504, "r_x1": 545.115, "r_y1": 294.504, "r_x2": 545.115, "r_y2": 285.952, "r_x3": 308.862, "r_y3": 285.952, "coord_origin": "TOPLEFT"}, "text": "the fact that tables are notoriously time-consuming to an-", "orig": "the fact that tables are notoriously time-consuming to an-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 118, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 306.459, "r_x1": 545.115, "r_y1": 306.459, "r_x2": 545.115, "r_y2": 297.907, "r_x3": 308.862, "r_y3": 297.907, "coord_origin": "TOPLEFT"}, "text": "notate by hand. However, this has definitely changed in re-", "orig": "notate by hand. However, this has definitely changed in re-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 119, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 318.414, "r_x1": 545.115, "r_y1": 318.414, "r_x2": 545.115, "r_y2": 309.862, "r_x3": 308.862, "r_y3": 309.862, "coord_origin": "TOPLEFT"}, "text": "cent years with the deliverance of PubTabNet [37], FinTab-", "orig": "cent years with the deliverance of PubTabNet [37], FinTab-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 120, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 330.369, "r_x1": 425.923, "r_y1": 330.369, "r_x2": 425.923, "r_y2": 321.817, "r_x3": 308.862, "r_y3": 321.817, "coord_origin": "TOPLEFT"}, "text": "Net [36], TableBank [17] etc.", "orig": "Net [36], TableBank [17] etc.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Identifying the structure of a table has been an outstanding problem in the document-parsing community, that motivates many organised public challenges [6, 4, 14]. The difficulty of the problem can be attributed to a number of factors. First, there is a large variety in the shapes and sizes of tables. Such large variety requires a flexible method. This is especially true for complex column- and row headers, which can be extremely intricate and demanding. A second factor of complexity is the lack of data with regard to table-structure. Until the publication of PubTabNet [37], there were no large datasets (i.e. > 100 K tables) that provided structure information. This happens primarily due to the fact that tables are notoriously time-consuming to annotate by hand. However, this has definitely changed in recent years with the deliverance of PubTabNet [37], FinTabNet [36], TableBank [17] etc."}, {"label": "text", "id": 1, "page_no": 1, "cluster": {"id": 1, "label": "text", "bbox": {"l": 308.862, "t": 333.838, "r": 545.115, "b": 449.987, "coord_origin": "TOPLEFT"}, "confidence": 0.9869040250778198, "cells": [{"index": 121, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 342.39, "r_x1": 391.492, "r_y1": 342.39, "r_x2": 391.492, "r_y2": 333.838, "r_x3": 320.817, "r_y3": 333.838, "coord_origin": "TOPLEFT"}, "text": "Before the rising", "orig": "Before the rising", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 122, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 395.845, "r_y0": 342.39, "r_x1": 436.802, "r_y1": 342.39, "r_x2": 436.802, "r_y2": 333.838, "r_x3": 395.845, "r_y3": 333.838, "coord_origin": "TOPLEFT"}, "text": "popularity", "orig": "popularity", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 123, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 441.145, "r_y0": 342.39, "r_x1": 449.444, "r_y1": 342.39, "r_x2": 449.444, "r_y2": 333.838, "r_x3": 441.145, "r_y3": 333.838, "coord_origin": "TOPLEFT"}, "text": "of", "orig": "of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 124, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 453.798, "r_y0": 342.39, "r_x1": 545.115, "r_y1": 342.39, "r_x2": 545.115, "r_y2": 333.838, "r_x3": 453.798, "r_y3": 333.838, "coord_origin": "TOPLEFT"}, "text": "deep neural networks,", "orig": "deep neural networks,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 125, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 354.345, "r_x1": 545.115, "r_y1": 354.345, "r_x2": 545.115, "r_y2": 345.793, "r_x3": 308.862, "r_y3": 345.793, "coord_origin": "TOPLEFT"}, "text": "the community relied heavily on heuristic and/or statistical", "orig": "the community relied heavily on heuristic and/or statistical", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 126, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 366.3, "r_x1": 545.115, "r_y1": 366.3, "r_x2": 545.115, "r_y2": 357.748, "r_x3": 308.862, "r_y3": 357.748, "coord_origin": "TOPLEFT"}, "text": "methods to do table structure identification [3, 7, 11, 5, 13,", "orig": "methods to do table structure identification [3, 7, 11, 5, 13,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 127, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 378.256, "r_x1": 324.633, "r_y1": 378.256, "r_x2": 324.633, "r_y2": 369.704, "r_x3": 308.862, "r_y3": 369.704, "coord_origin": "TOPLEFT"}, "text": "28].", "orig": "28].", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 128, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 329.634, "r_y0": 378.256, "r_x1": 545.115, "r_y1": 378.256, "r_x2": 545.115, "r_y2": 369.704, "r_x3": 329.634, "r_y3": 369.704, "coord_origin": "TOPLEFT"}, "text": "Although such methods work well on constrained ta-", "orig": "Although such methods work well on constrained ta-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 129, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 390.211, "r_x1": 545.115, "r_y1": 390.211, "r_x2": 545.115, "r_y2": 381.659, "r_x3": 308.862, "r_y3": 381.659, "coord_origin": "TOPLEFT"}, "text": "bles [12], a more data-driven approach can be applied due", "orig": "bles [12], a more data-driven approach can be applied due", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 130, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 402.166, "r_x1": 545.115, "r_y1": 402.166, "r_x2": 545.115, "r_y2": 393.614, "r_x3": 308.862, "r_y3": 393.614, "coord_origin": "TOPLEFT"}, "text": "to the advent of convolutional neural networks (CNNs) and", "orig": "to the advent of convolutional neural networks (CNNs) and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 131, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 414.121, "r_x1": 438.416, "r_y1": 414.121, "r_x2": 438.416, "r_y2": 405.569, "r_x3": 308.862, "r_y3": 405.569, "coord_origin": "TOPLEFT"}, "text": "the availability of large datasets.", "orig": "the availability of large datasets.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 132, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 442.231, "r_y0": 414.121, "r_x1": 545.115, "r_y1": 414.121, "r_x2": 545.115, "r_y2": 405.569, "r_x3": 442.231, "r_y3": 405.569, "coord_origin": "TOPLEFT"}, "text": "To the best-of-our knowl-", "orig": "To the best-of-our knowl-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 133, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 426.076, "r_x1": 545.115, "r_y1": 426.076, "r_x2": 545.115, "r_y2": 417.524, "r_x3": 308.862, "r_y3": 417.524, "coord_origin": "TOPLEFT"}, "text": "edge, there are currently two different types of network ar-", "orig": "edge, there are currently two different types of network ar-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 134, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 438.032, "r_x1": 545.115, "r_y1": 438.032, "r_x2": 545.115, "r_y2": 429.48, "r_x3": 308.862, "r_y3": 429.48, "coord_origin": "TOPLEFT"}, "text": "chitecture that are being pursued for state-of-the-art table-", "orig": "chitecture that are being pursued for state-of-the-art table-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 135, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 449.987, "r_x1": 401.285, "r_y1": 449.987, "r_x2": 401.285, "r_y2": 441.435, "r_x3": 308.862, "r_y3": 441.435, "coord_origin": "TOPLEFT"}, "text": "structure identification.", "orig": "structure identification.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Before the rising popularity of deep neural networks, the community relied heavily on heuristic and/or statistical methods to do table structure identification [3, 7, 11, 5, 13, 28]. Although such methods work well on constrained tables [12], a more data-driven approach can be applied due to the advent of convolutional neural networks (CNNs) and the availability of large datasets. To the best-of-our knowledge, there are currently two different types of network architecture that are being pursued for state-of-the-art tablestructure identification."}, {"label": "text", "id": 3, "page_no": 1, "cluster": {"id": 3, "label": "text", "bbox": {"l": 308.862, "t": 453.068, "r": 545.117, "b": 713.066, "coord_origin": "TOPLEFT"}, "confidence": 0.9843218326568604, "cells": [{"index": 136, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 462.024, "r_x1": 423.262, "r_y1": 462.024, "r_x2": 423.262, "r_y2": 453.068, "r_x3": 320.817, "r_y3": 453.068, "coord_origin": "TOPLEFT"}, "text": "Image-to-Text networks", "orig": "Image-to-Text networks", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 137, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 423.267, "r_y0": 462.008, "r_x1": 426.037, "r_y1": 462.008, "r_x2": 426.037, "r_y2": 453.456, "r_x3": 423.267, "r_y3": 453.456, "coord_origin": "TOPLEFT"}, "text": ":", "orig": ":", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 138, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 430.769, "r_y0": 462.008, "r_x1": 545.11, "r_y1": 462.008, "r_x2": 545.11, "r_y2": 453.456, "r_x3": 430.769, "r_y3": 453.456, "coord_origin": "TOPLEFT"}, "text": "In this type of network, one", "orig": "In this type of network, one", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 139, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 473.963, "r_x1": 340.404, "r_y1": 473.963, "r_x2": 340.404, "r_y2": 465.411, "r_x3": 308.862, "r_y3": 465.411, "coord_origin": "TOPLEFT"}, "text": "predicts", "orig": "predicts", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 140, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 345.116, "r_y0": 473.963, "r_x1": 349.539, "r_y1": 473.963, "r_x2": 349.539, "r_y2": 465.411, "r_x3": 345.116, "r_y3": 465.411, "coord_origin": "TOPLEFT"}, "text": "a", "orig": "a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 141, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 354.252, "r_y0": 473.963, "r_x1": 390.765, "r_y1": 473.963, "r_x2": 390.765, "r_y2": 465.411, "r_x3": 354.252, "r_y3": 465.411, "coord_origin": "TOPLEFT"}, "text": "sequence", "orig": "sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 142, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 395.477, "r_y0": 473.963, "r_x1": 403.776, "r_y1": 473.963, "r_x2": 403.776, "r_y2": 465.411, "r_x3": 395.477, "r_y3": 465.411, "coord_origin": "TOPLEFT"}, "text": "of", "orig": "of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 143, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 408.488, "r_y0": 473.963, "r_x1": 434.401, "r_y1": 473.963, "r_x2": 434.401, "r_y2": 465.411, "r_x3": 408.488, "r_y3": 465.411, "coord_origin": "TOPLEFT"}, "text": "tokens", "orig": "tokens", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 144, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 439.113, "r_y0": 473.963, "r_x1": 469.001, "r_y1": 473.963, "r_x2": 469.001, "r_y2": 465.411, "r_x3": 439.113, "r_y3": 465.411, "coord_origin": "TOPLEFT"}, "text": "starting", "orig": "starting", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 145, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 473.713, "r_y0": 473.963, "r_x1": 545.115, "r_y1": 473.963, "r_x2": 545.115, "r_y2": 465.411, "r_x3": 473.713, "r_y3": 465.411, "coord_origin": "TOPLEFT"}, "text": "from an encoded", "orig": "from an encoded", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 146, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 485.918, "r_x1": 335.701, "r_y1": 485.918, "r_x2": 335.701, "r_y2": 477.366, "r_x3": 308.862, "r_y3": 477.366, "coord_origin": "TOPLEFT"}, "text": "image.", "orig": "image.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 147, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 345.853, "r_y0": 485.918, "r_x1": 411.009, "r_y1": 485.918, "r_x2": 411.009, "r_y2": 477.366, "r_x3": 345.853, "r_y3": 477.366, "coord_origin": "TOPLEFT"}, "text": "Such sequences", "orig": "Such sequences", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 148, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 415.85, "r_y0": 485.918, "r_x1": 424.149, "r_y1": 485.918, "r_x2": 424.149, "r_y2": 477.366, "r_x3": 415.85, "r_y3": 477.366, "coord_origin": "TOPLEFT"}, "text": "of", "orig": "of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 149, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 429.001, "r_y0": 485.918, "r_x1": 454.914, "r_y1": 485.918, "r_x2": 454.914, "r_y2": 477.366, "r_x3": 429.001, "r_y3": 477.366, "coord_origin": "TOPLEFT"}, "text": "tokens", "orig": "tokens", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 150, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 459.756, "r_y0": 485.918, "r_x1": 473.584, "r_y1": 485.918, "r_x2": 473.584, "r_y2": 477.366, "r_x3": 459.756, "r_y3": 477.366, "coord_origin": "TOPLEFT"}, "text": "can", "orig": "can", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 151, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 478.425, "r_y0": 485.918, "r_x1": 487.83, "r_y1": 485.918, "r_x2": 487.83, "r_y2": 477.366, "r_x3": 478.425, "r_y3": 477.366, "coord_origin": "TOPLEFT"}, "text": "be", "orig": "be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 152, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 492.682, "r_y0": 485.918, "r_x1": 545.115, "r_y1": 485.918, "r_x2": 545.115, "r_y2": 477.366, "r_x3": 492.682, "r_y3": 477.366, "coord_origin": "TOPLEFT"}, "text": "HTML table", "orig": "HTML table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 153, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 497.873, "r_x1": 459.218, "r_y1": 497.873, "r_x2": 459.218, "r_y2": 489.321, "r_x3": 308.862, "r_y3": 489.321, "coord_origin": "TOPLEFT"}, "text": "tags [37, 17] or LaTeX symbols[10].", "orig": "tags [37, 17] or LaTeX symbols[10].", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 154, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 465.115, "r_y0": 497.873, "r_x1": 545.115, "r_y1": 497.873, "r_x2": 545.115, "r_y2": 489.321, "r_x3": 465.115, "r_y3": 489.321, "coord_origin": "TOPLEFT"}, "text": "The choice of sym-", "orig": "The choice of sym-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 155, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 509.828, "r_x1": 545.115, "r_y1": 509.828, "r_x2": 545.115, "r_y2": 501.276, "r_x3": 308.862, "r_y3": 501.276, "coord_origin": "TOPLEFT"}, "text": "bols is ultimately not very important, since one can be trans-", "orig": "bols is ultimately not very important, since one can be trans-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 156, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 521.784, "r_x1": 396.692, "r_y1": 521.784, "r_x2": 396.692, "r_y2": 513.232, "r_x3": 308.862, "r_y3": 513.232, "coord_origin": "TOPLEFT"}, "text": "formed into the other.", "orig": "formed into the other.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 157, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 401.265, "r_y0": 521.784, "r_x1": 545.115, "r_y1": 521.784, "r_x2": 545.115, "r_y2": 513.232, "r_x3": 401.265, "r_y3": 513.232, "coord_origin": "TOPLEFT"}, "text": "There are however subtle variations", "orig": "There are however subtle variations", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 158, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 533.739, "r_x1": 433.484, "r_y1": 533.739, "r_x2": 433.484, "r_y2": 525.187, "r_x3": 308.862, "r_y3": 525.187, "coord_origin": "TOPLEFT"}, "text": "in the Image-to-Text networks.", "orig": "in the Image-to-Text networks.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 159, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 438.187, "r_y0": 533.739, "r_x1": 545.115, "r_y1": 533.739, "r_x2": 545.115, "r_y2": 525.187, "r_x3": 438.187, "r_y3": 525.187, "coord_origin": "TOPLEFT"}, "text": "The easiest network archi-", "orig": "The easiest network archi-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 160, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 545.694, "r_x1": 420.941, "r_y1": 545.694, "r_x2": 420.941, "r_y2": 537.142, "r_x3": 308.862, "r_y3": 537.142, "coord_origin": "TOPLEFT"}, "text": "tectures are 'image-encoder", "orig": "tectures are 'image-encoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 161, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 423.595, "r_y0": 545.388, "r_x1": 433.558, "r_y1": 545.388, "r_x2": 433.558, "r_y2": 536.8240000000001, "r_x3": 423.595, "r_y3": 536.8240000000001, "coord_origin": "TOPLEFT"}, "text": "\u2192", "orig": "\u2192", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 162, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 436.212, "r_y0": 545.694, "r_x1": 545.113, "r_y1": 545.694, "r_x2": 545.113, "r_y2": 537.142, "r_x3": 436.212, "r_y3": 537.142, "coord_origin": "TOPLEFT"}, "text": "text-decoder' (IETD), sim-", "orig": "text-decoder' (IETD), sim-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 163, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 557.649, "r_x1": 545.115, "r_y1": 557.649, "r_x2": 545.115, "r_y2": 549.097, "r_x3": 308.862, "r_y3": 549.097, "coord_origin": "TOPLEFT"}, "text": "ilar to network architectures that try to provide captions to", "orig": "ilar to network architectures that try to provide captions to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 164, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 569.604, "r_x1": 545.115, "r_y1": 569.604, "r_x2": 545.115, "r_y2": 561.052, "r_x3": 308.862, "r_y3": 561.052, "coord_origin": "TOPLEFT"}, "text": "images [32]. In these IETD networks, one expects as output", "orig": "images [32]. In these IETD networks, one expects as output", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 165, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 581.559, "r_x1": 503.671, "r_y1": 581.559, "r_x2": 503.671, "r_y2": 573.0070000000001, "r_x3": 308.862, "r_y3": 573.0070000000001, "coord_origin": "TOPLEFT"}, "text": "the LaTeX/HTML string of the entire table, i.e.", "orig": "the LaTeX/HTML string of the entire table, i.e.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 166, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 509.579, "r_y0": 581.559, "r_x1": 545.115, "r_y1": 581.559, "r_x2": 545.115, "r_y2": 573.0070000000001, "r_x3": 509.579, "r_y3": 573.0070000000001, "coord_origin": "TOPLEFT"}, "text": "the sym-", "orig": "the sym-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 167, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 593.515, "r_x1": 545.115, "r_y1": 593.515, "r_x2": 545.115, "r_y2": 584.963, "r_x3": 308.862, "r_y3": 584.963, "coord_origin": "TOPLEFT"}, "text": "bols necessary for creating the table with the content of the", "orig": "bols necessary for creating the table with the content of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 168, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 605.47, "r_x1": 330.72, "r_y1": 605.47, "r_x2": 330.72, "r_y2": 596.918, "r_x3": 308.862, "r_y3": 596.918, "coord_origin": "TOPLEFT"}, "text": "table.", "orig": "table.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 169, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 334.536, "r_y0": 605.47, "r_x1": 497.075, "r_y1": 605.47, "r_x2": 497.075, "r_y2": 596.918, "r_x3": 334.536, "r_y3": 596.918, "coord_origin": "TOPLEFT"}, "text": "Another approach is the 'image-encoder", "orig": "Another approach is the 'image-encoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 170, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 499.805, "r_y0": 605.164, "r_x1": 509.768, "r_y1": 605.164, "r_x2": 509.768, "r_y2": 596.6, "r_x3": 499.805, "r_y3": 596.6, "coord_origin": "TOPLEFT"}, "text": "\u2192", "orig": "\u2192", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 171, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 512.501, "r_y0": 605.47, "r_x1": 545.109, "r_y1": 605.47, "r_x2": 545.109, "r_y2": 596.918, "r_x3": 512.501, "r_y3": 596.918, "coord_origin": "TOPLEFT"}, "text": "dual de-", "orig": "dual de-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 172, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 617.425, "r_x1": 545.115, "r_y1": 617.425, "r_x2": 545.115, "r_y2": 608.873, "r_x3": 308.862, "r_y3": 608.873, "coord_origin": "TOPLEFT"}, "text": "coder' (IEDD) networks. In these type of networks, one has", "orig": "coder' (IEDD) networks. In these type of networks, one has", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 173, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 629.38, "r_x1": 545.115, "r_y1": 629.38, "r_x2": 545.115, "r_y2": 620.828, "r_x3": 308.862, "r_y3": 620.828, "coord_origin": "TOPLEFT"}, "text": "two consecutive decoders with different purposes. The first", "orig": "two consecutive decoders with different purposes. The first", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 174, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 641.335, "r_x1": 364.782, "r_y1": 641.335, "r_x2": 364.782, "r_y2": 632.783, "r_x3": 308.862, "r_y3": 632.783, "coord_origin": "TOPLEFT"}, "text": "decoder is the", "orig": "decoder is the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 175, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 367.574, "r_y0": 641.192, "r_x1": 415.614, "r_y1": 641.192, "r_x2": 415.614, "r_y2": 632.604, "r_x3": 367.574, "r_y3": 632.604, "coord_origin": "TOPLEFT"}, "text": "tag-decoder", "orig": "tag-decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 176, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 415.613, "r_y0": 641.335, "r_x1": 418.104, "r_y1": 641.335, "r_x2": 418.104, "r_y2": 632.783, "r_x3": 415.613, "r_y3": 632.783, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 177, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 420.963, "r_y0": 641.335, "r_x1": 433.137, "r_y1": 641.335, "r_x2": 433.137, "r_y2": 632.783, "r_x3": 420.963, "r_y3": 632.783, "coord_origin": "TOPLEFT"}, "text": "i.e.", "orig": "i.e.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 178, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 437.122, "r_y0": 641.335, "r_x1": 442.661, "r_y1": 641.335, "r_x2": 442.661, "r_y2": 632.783, "r_x3": 437.122, "r_y3": 632.783, "coord_origin": "TOPLEFT"}, "text": "it", "orig": "it", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 179, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 445.441, "r_y0": 641.335, "r_x1": 545.117, "r_y1": 641.335, "r_x2": 545.117, "r_y2": 632.783, "r_x3": 445.441, "r_y3": 632.783, "coord_origin": "TOPLEFT"}, "text": "only produces the HTM-", "orig": "only produces the HTM-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 180, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 653.29, "r_x1": 545.115, "r_y1": 653.29, "r_x2": 545.115, "r_y2": 644.738, "r_x3": 308.862, "r_y3": 644.738, "coord_origin": "TOPLEFT"}, "text": "L/LaTeX tags which construct an empty table. The second", "orig": "L/LaTeX tags which construct an empty table. The second", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 181, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 665.103, "r_x1": 373.599, "r_y1": 665.103, "r_x2": 373.599, "r_y2": 656.515, "r_x3": 308.862, "r_y3": 656.515, "coord_origin": "TOPLEFT"}, "text": "content-decoder", "orig": "content-decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 182, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 376.907, "r_y0": 665.246, "r_x1": 545.116, "r_y1": 665.246, "r_x2": 545.116, "r_y2": 656.694, "r_x3": 376.907, "r_y3": 656.694, "coord_origin": "TOPLEFT"}, "text": "uses the encoding of the image in combi-", "orig": "uses the encoding of the image in combi-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 183, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 677.201, "r_x1": 545.115, "r_y1": 677.201, "r_x2": 545.115, "r_y2": 668.649, "r_x3": 308.862, "r_y3": 668.649, "coord_origin": "TOPLEFT"}, "text": "nation with the output encoding of each cell-tag (from the", "orig": "nation with the output encoding of each cell-tag (from the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 184, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 689.013, "r_x1": 356.902, "r_y1": 689.013, "r_x2": 356.902, "r_y2": 680.425, "r_x3": 308.862, "r_y3": 680.425, "coord_origin": "TOPLEFT"}, "text": "tag-decoder", "orig": "tag-decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 185, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 357.131, "r_y0": 689.156, "r_x1": 360.449, "r_y1": 689.156, "r_x2": 360.449, "r_y2": 680.604, "r_x3": 357.131, "r_y3": 680.604, "coord_origin": "TOPLEFT"}, "text": ")", "orig": ")", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 186, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 364.045, "r_y0": 689.156, "r_x1": 545.115, "r_y1": 689.156, "r_x2": 545.115, "r_y2": 680.604, "r_x3": 364.045, "r_y3": 680.604, "coord_origin": "TOPLEFT"}, "text": "to generate the textual content of each table", "orig": "to generate the textual content of each table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 187, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 701.111, "r_x1": 325.739, "r_y1": 701.111, "r_x2": 325.739, "r_y2": 692.559, "r_x3": 308.862, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "cell.", "orig": "cell.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 188, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 331.746, "r_y0": 701.111, "r_x1": 545.115, "r_y1": 701.111, "r_x2": 545.115, "r_y2": 692.559, "r_x3": 331.746, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "The network architecture of IEDD is certainly more", "orig": "The network architecture of IEDD is certainly more", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 189, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 713.066, "r_x1": 545.115, "r_y1": 713.066, "r_x2": 545.115, "r_y2": 704.514, "r_x3": 308.862, "r_y3": 704.514, "coord_origin": "TOPLEFT"}, "text": "elaborate, but it has the advantage that one can pre-train the", "orig": "elaborate, but it has the advantage that one can pre-train the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Image-to-Text networks : In this type of network, one predicts a sequence of tokens starting from an encoded image. Such sequences of tokens can be HTML table tags [37, 17] or LaTeX symbols[10]. The choice of symbols is ultimately not very important, since one can be transformed into the other. There are however subtle variations in the Image-to-Text networks. The easiest network architectures are 'image-encoder \u2192 text-decoder' (IETD), similar to network architectures that try to provide captions to images [32]. In these IETD networks, one expects as output the LaTeX/HTML string of the entire table, i.e. the symbols necessary for creating the table with the content of the table. Another approach is the 'image-encoder \u2192 dual decoder' (IEDD) networks. In these type of networks, one has two consecutive decoders with different purposes. The first decoder is the tag-decoder , i.e. it only produces the HTML/LaTeX tags which construct an empty table. The second content-decoder uses the encoding of the image in combination with the output encoding of each cell-tag (from the tag-decoder ) to generate the textual content of each table cell. The network architecture of IEDD is certainly more elaborate, but it has the advantage that one can pre-train the"}, {"label": "page_footer", "id": 15, "page_no": 1, "cluster": {"id": 15, "label": "page_footer", "bbox": {"l": 295.121, "t": 734.402, "r": 300.102, "b": 742.954, "coord_origin": "TOPLEFT"}, "confidence": 0.8778094053268433, "cells": [{"index": 190, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 295.121, "r_y0": 742.954, "r_x1": 300.102, "r_y1": 742.954, "r_x2": 300.102, "r_y2": 734.402, "r_x3": 295.121, "r_y3": 734.402, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "2"}], "body": [{"label": "text", "id": 12, "page_no": 1, "cluster": {"id": 12, "label": "text", "bbox": {"l": 50.112, "t": 75.47699999999998, "r": 286.365, "b": 95.98400000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.9656890034675598, "cells": [{"index": 0, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 84.029, "r_x1": 286.365, "r_y1": 84.029, "r_x2": 286.365, "r_y2": 75.47699999999998, "r_x3": 50.112, "r_y3": 75.47699999999998, "coord_origin": "TOPLEFT"}, "text": "considered as a solved problem, given enough ground-truth", "orig": "considered as a solved problem, given enough ground-truth", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 95.98400000000004, "r_x1": 112.647, "r_y1": 95.98400000000004, "r_x2": 112.647, "r_y2": 87.43200000000002, "r_x3": 50.112, "r_y3": 87.43200000000002, "coord_origin": "TOPLEFT"}, "text": "data to train on.", "orig": "data to train on.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "considered as a solved problem, given enough ground-truth data to train on."}, {"label": "text", "id": 4, "page_no": 1, "cluster": {"id": 4, "label": "text", "bbox": {"l": 50.112, "t": 99.84000000000003, "r": 286.365, "b": 227.94399999999996, "coord_origin": "TOPLEFT"}, "confidence": 0.9838606119155884, "cells": [{"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 108.39200000000005, "r_x1": 286.365, "r_y1": 108.39200000000005, "r_x2": 286.365, "r_y2": 99.84000000000003, "r_x3": 62.067, "r_y3": 99.84000000000003, "coord_origin": "TOPLEFT"}, "text": "The second problem is called table-structure decompo-", "orig": "The second problem is called table-structure decompo-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 120.34699999999998, "r_x1": 74.75, "r_y1": 120.34699999999998, "r_x2": 74.75, "r_y2": 111.79499999999996, "r_x3": 50.112, "r_y3": 111.79499999999996, "coord_origin": "TOPLEFT"}, "text": "sition.", "orig": "sition.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 81.335, "r_y0": 120.34699999999998, "r_x1": 286.365, "r_y1": 120.34699999999998, "r_x2": 286.365, "r_y2": 111.79499999999996, "r_x3": 81.335, "r_y3": 111.79499999999996, "coord_origin": "TOPLEFT"}, "text": "The latter is a long standing problem in the com-", "orig": "The latter is a long standing problem in the com-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 132.30200000000002, "r_x1": 235.117, "r_y1": 132.30200000000002, "r_x2": 235.117, "r_y2": 123.75, "r_x3": 50.112, "r_y3": 123.75, "coord_origin": "TOPLEFT"}, "text": "munity of document understanding [6, 4, 14].", "orig": "munity of document understanding [6, 4, 14].", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 240.079, "r_y0": 132.30200000000002, "r_x1": 286.365, "r_y1": 132.30200000000002, "r_x2": 286.365, "r_y2": 123.75, "r_x3": 240.079, "r_y3": 123.75, "coord_origin": "TOPLEFT"}, "text": "Contrary to", "orig": "Contrary to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 144.25699999999995, "r_x1": 286.365, "r_y1": 144.25699999999995, "r_x2": 286.365, "r_y2": 135.70500000000004, "r_x3": 50.112, "r_y3": 135.70500000000004, "coord_origin": "TOPLEFT"}, "text": "the table-location problem, there are no commonly used ap-", "orig": "the table-location problem, there are no commonly used ap-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 156.21299999999997, "r_x1": 286.365, "r_y1": 156.21299999999997, "r_x2": 286.365, "r_y2": 147.66099999999994, "r_x3": 50.112, "r_y3": 147.66099999999994, "coord_origin": "TOPLEFT"}, "text": "proaches that can easily be re-purposed to solve this prob-", "orig": "proaches that can easily be re-purposed to solve this prob-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 168.168, "r_x1": 286.365, "r_y1": 168.168, "r_x2": 286.365, "r_y2": 159.61599999999999, "r_x3": 50.112, "r_y3": 159.61599999999999, "coord_origin": "TOPLEFT"}, "text": "lem. Lately, a set of new model-architectures has been pro-", "orig": "lem. Lately, a set of new model-architectures has been pro-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 180.12300000000005, "r_x1": 286.365, "r_y1": 180.12300000000005, "r_x2": 286.365, "r_y2": 171.57100000000003, "r_x3": 50.112, "r_y3": 171.57100000000003, "coord_origin": "TOPLEFT"}, "text": "posed by the community to address table-structure decom-", "orig": "posed by the community to address table-structure decom-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 192.07799999999997, "r_x1": 286.365, "r_y1": 192.07799999999997, "r_x2": 286.365, "r_y2": 183.52599999999995, "r_x3": 50.112, "r_y3": 183.52599999999995, "coord_origin": "TOPLEFT"}, "text": "position [37, 36, 18, 20]. All these models have some weak-", "orig": "position [37, 36, 18, 20]. All these models have some weak-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 204.03300000000002, "r_x1": 114.51, "r_y1": 204.03300000000002, "r_x2": 114.51, "r_y2": 195.481, "r_x3": 50.112, "r_y3": 195.481, "coord_origin": "TOPLEFT"}, "text": "nesses (see Sec.", "orig": "nesses (see Sec.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 119.163, "r_y0": 204.03300000000002, "r_x1": 129.952, "r_y1": 204.03300000000002, "r_x2": 129.952, "r_y2": 195.481, "r_x3": 119.163, "r_y3": 195.481, "coord_origin": "TOPLEFT"}, "text": "2).", "orig": "2).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.615, "r_y0": 204.03300000000002, "r_x1": 286.365, "r_y1": 204.03300000000002, "r_x2": 286.365, "r_y2": 195.481, "r_x3": 134.615, "r_y3": 195.481, "coord_origin": "TOPLEFT"}, "text": "The common denominator here is the", "orig": "The common denominator here is the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 215.98800000000006, "r_x1": 286.365, "r_y1": 215.98800000000006, "r_x2": 286.365, "r_y2": 207.43600000000004, "r_x3": 50.112, "r_y3": 207.43600000000004, "coord_origin": "TOPLEFT"}, "text": "reliance on textual features and/or the inability to provide", "orig": "reliance on textual features and/or the inability to provide", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 227.94399999999996, "r_x1": 278.664, "r_y1": 227.94399999999996, "r_x2": 278.664, "r_y2": 219.39200000000005, "r_x3": 50.112, "r_y3": 219.39200000000005, "coord_origin": "TOPLEFT"}, "text": "the bounding box of each table-cell in the original image.", "orig": "the bounding box of each table-cell in the original image.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "The second problem is called table-structure decomposition. The latter is a long standing problem in the community of document understanding [6, 4, 14]. Contrary to the table-location problem, there are no commonly used approaches that can easily be re-purposed to solve this problem. Lately, a set of new model-architectures has been proposed by the community to address table-structure decomposition [37, 36, 18, 20]. All these models have some weaknesses (see Sec. 2). The common denominator here is the reliance on textual features and/or the inability to provide the bounding box of each table-cell in the original image."}, {"label": "text", "id": 2, "page_no": 1, "cluster": {"id": 2, "label": "text", "bbox": {"l": 50.112, "t": 231.79999999999995, "r": 286.365, "b": 371.859, "coord_origin": "TOPLEFT"}, "confidence": 0.9855920076370239, "cells": [{"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 240.35199999999998, "r_x1": 286.365, "r_y1": 240.35199999999998, "r_x2": 286.365, "r_y2": 231.79999999999995, "r_x3": 62.067, "r_y3": 231.79999999999995, "coord_origin": "TOPLEFT"}, "text": "In this paper, we want to address these weaknesses and", "orig": "In this paper, we want to address these weaknesses and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 252.30700000000002, "r_x1": 78.884, "r_y1": 252.30700000000002, "r_x2": 78.884, "r_y2": 243.755, "r_x3": 50.112, "r_y3": 243.755, "coord_origin": "TOPLEFT"}, "text": "present", "orig": "present", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 19, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 83.068, "r_y0": 252.30700000000002, "r_x1": 116.373, "r_y1": 252.30700000000002, "r_x2": 116.373, "r_y2": 243.755, "r_x3": 83.068, "r_y3": 243.755, "coord_origin": "TOPLEFT"}, "text": "a robust", "orig": "a robust", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 20, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 120.558, "r_y0": 252.30700000000002, "r_x1": 178.102, "r_y1": 252.30700000000002, "r_x2": 178.102, "r_y2": 243.755, "r_x3": 120.558, "r_y3": 243.755, "coord_origin": "TOPLEFT"}, "text": "table-structure", "orig": "table-structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 21, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 182.276, "r_y0": 252.30700000000002, "r_x1": 286.365, "r_y1": 252.30700000000002, "r_x2": 286.365, "r_y2": 243.755, "r_x3": 182.276, "r_y3": 243.755, "coord_origin": "TOPLEFT"}, "text": "decomposition algorithm.", "orig": "decomposition algorithm.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 22, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 264.26199999999994, "r_x1": 260.432, "r_y1": 264.26199999999994, "r_x2": 260.432, "r_y2": 255.71000000000004, "r_x3": 50.112, "r_y3": 255.71000000000004, "coord_origin": "TOPLEFT"}, "text": "The design criteria for our model are the following.", "orig": "The design criteria for our model are the following.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 23, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 265.603, "r_y0": 264.26199999999994, "r_x1": 286.365, "r_y1": 264.26199999999994, "r_x2": 286.365, "r_y2": 255.71000000000004, "r_x3": 265.603, "r_y3": 255.71000000000004, "coord_origin": "TOPLEFT"}, "text": "First,", "orig": "First,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 24, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 276.217, "r_x1": 286.365, "r_y1": 276.217, "r_x2": 286.365, "r_y2": 267.66499999999996, "r_x3": 50.112, "r_y3": 267.66499999999996, "coord_origin": "TOPLEFT"}, "text": "we want our algorithm to be language agnostic. In this way,", "orig": "we want our algorithm to be language agnostic. In this way,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 25, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 288.172, "r_x1": 286.365, "r_y1": 288.172, "r_x2": 286.365, "r_y2": 279.62, "r_x3": 50.112, "r_y3": 279.62, "coord_origin": "TOPLEFT"}, "text": "we can obtain the structure of any table, irregardless of the", "orig": "we can obtain the structure of any table, irregardless of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 26, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 300.128, "r_x1": 88.568, "r_y1": 300.128, "r_x2": 88.568, "r_y2": 291.576, "r_x3": 50.112, "r_y3": 291.576, "coord_origin": "TOPLEFT"}, "text": "language.", "orig": "language.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 27, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 95.502, "r_y0": 300.128, "r_x1": 286.365, "r_y1": 300.128, "r_x2": 286.365, "r_y2": 291.576, "r_x3": 95.502, "r_y3": 291.576, "coord_origin": "TOPLEFT"}, "text": "Second, we want our algorithm to leverage as", "orig": "Second, we want our algorithm to leverage as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 28, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 312.083, "r_x1": 286.365, "r_y1": 312.083, "r_x2": 286.365, "r_y2": 303.531, "r_x3": 50.112, "r_y3": 303.531, "coord_origin": "TOPLEFT"}, "text": "much data as possible from the original PDF document. For", "orig": "much data as possible from the original PDF document. For", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 29, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 324.038, "r_x1": 286.365, "r_y1": 324.038, "r_x2": 286.365, "r_y2": 315.486, "r_x3": 50.112, "r_y3": 315.486, "coord_origin": "TOPLEFT"}, "text": "programmatic PDF documents, the text-cells can often be", "orig": "programmatic PDF documents, the text-cells can often be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 30, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 335.993, "r_x1": 286.365, "r_y1": 335.993, "r_x2": 286.365, "r_y2": 327.441, "r_x3": 50.112, "r_y3": 327.441, "coord_origin": "TOPLEFT"}, "text": "extracted much faster and with higher accuracy compared", "orig": "extracted much faster and with higher accuracy compared", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 347.948, "r_x1": 286.365, "r_y1": 347.948, "r_x2": 286.365, "r_y2": 339.396, "r_x3": 50.112, "r_y3": 339.396, "coord_origin": "TOPLEFT"}, "text": "to OCR methods. Last but not least, we want to have a di-", "orig": "to OCR methods. Last but not least, we want to have a di-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 359.904, "r_x1": 286.365, "r_y1": 359.904, "r_x2": 286.365, "r_y2": 351.352, "r_x3": 50.112, "r_y3": 351.352, "coord_origin": "TOPLEFT"}, "text": "rect link between the table-cell and its bounding box in the", "orig": "rect link between the table-cell and its bounding box in the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 371.859, "r_x1": 76.951, "r_y1": 371.859, "r_x2": 76.951, "r_y2": 363.307, "r_x3": 50.112, "r_y3": 363.307, "coord_origin": "TOPLEFT"}, "text": "image.", "orig": "image.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "In this paper, we want to address these weaknesses and present a robust table-structure decomposition algorithm. The design criteria for our model are the following. First, we want our algorithm to be language agnostic. In this way, we can obtain the structure of any table, irregardless of the language. Second, we want our algorithm to leverage as much data as possible from the original PDF document. For programmatic PDF documents, the text-cells can often be extracted much faster and with higher accuracy compared to OCR methods. Last but not least, we want to have a direct link between the table-cell and its bounding box in the image."}, {"label": "text", "id": 7, "page_no": 1, "cluster": {"id": 7, "label": "text", "bbox": {"l": 50.112, "t": 375.715, "r": 286.367, "b": 432.087, "coord_origin": "TOPLEFT"}, "confidence": 0.9820111393928528, "cells": [{"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 384.267, "r_x1": 286.365, "r_y1": 384.267, "r_x2": 286.365, "r_y2": 375.715, "r_x3": 62.067, "r_y3": 375.715, "coord_origin": "TOPLEFT"}, "text": "To meet the design criteria listed above, we developed a", "orig": "To meet the design criteria listed above, we developed a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 396.222, "r_x1": 120.986, "r_y1": 396.222, "r_x2": 120.986, "r_y2": 387.67, "r_x3": 50.112, "r_y3": 387.67, "coord_origin": "TOPLEFT"}, "text": "new model called", "orig": "new model called", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 123.901, "r_y0": 396.238, "r_x1": 179.731, "r_y1": 396.238, "r_x2": 179.731, "r_y2": 387.282, "r_x3": 123.901, "r_y3": 387.282, "coord_origin": "TOPLEFT"}, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 182.646, "r_y0": 396.222, "r_x1": 286.367, "r_y1": 396.222, "r_x2": 286.367, "r_y2": 387.67, "r_x3": 182.646, "r_y3": 387.67, "coord_origin": "TOPLEFT"}, "text": "and a synthetically gener-", "orig": "and a synthetically gener-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 408.177, "r_x1": 181.758, "r_y1": 408.177, "r_x2": 181.758, "r_y2": 399.625, "r_x3": 50.112, "r_y3": 399.625, "coord_origin": "TOPLEFT"}, "text": "ated table structure dataset called", "orig": "ated table structure dataset called", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 184.104, "r_y0": 408.193, "r_x1": 240.203, "r_y1": 408.193, "r_x2": 240.203, "r_y2": 399.237, "r_x3": 184.104, "r_y3": 399.237, "coord_origin": "TOPLEFT"}, "text": "SynthTabNet", "orig": "SynthTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 240.204, "r_y0": 403.942, "r_x1": 243.691, "r_y1": 403.942, "r_x2": 243.691, "r_y2": 397.956, "r_x3": 240.204, "r_y3": 397.956, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 244.189, "r_y0": 408.177, "r_x1": 246.68, "r_y1": 408.177, "r_x2": 246.68, "r_y2": 399.625, "r_x3": 244.189, "r_y3": 399.625, "coord_origin": "TOPLEFT"}, "text": ".", "orig": ".", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 249.718, "r_y0": 408.177, "r_x1": 286.361, "r_y1": 408.177, "r_x2": 286.361, "r_y2": 399.625, "r_x3": 249.718, "r_y3": 399.625, "coord_origin": "TOPLEFT"}, "text": "In partic-", "orig": "In partic-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 420.132, "r_x1": 67.696, "r_y1": 420.132, "r_x2": 67.696, "r_y2": 411.58, "r_x3": 50.112, "r_y3": 411.58, "coord_origin": "TOPLEFT"}, "text": "ular,", "orig": "ular,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 71.322, "r_y0": 420.132, "r_x1": 286.365, "r_y1": 420.132, "r_x2": 286.365, "r_y2": 411.58, "r_x3": 71.322, "r_y3": 411.58, "coord_origin": "TOPLEFT"}, "text": "our contributions in this work can be summarised as", "orig": "our contributions in this work can be summarised as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 432.087, "r_x1": 82.52, "r_y1": 432.087, "r_x2": 82.52, "r_y2": 423.535, "r_x3": 50.112, "r_y3": 423.535, "coord_origin": "TOPLEFT"}, "text": "follows:", "orig": "follows:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "To meet the design criteria listed above, we developed a new model called TableFormer and a synthetically generated table structure dataset called SynthTabNet 1 . In particular, our contributions in this work can be summarised as follows:"}, {"label": "list_item", "id": 6, "page_no": 1, "cluster": {"id": 6, "label": "list_item", "bbox": {"l": 61.569, "t": 444.432, "r": 286.365, "b": 489.237, "coord_origin": "TOPLEFT"}, "confidence": 0.9822162389755249, "cells": [{"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 61.569, "r_y0": 453.372, "r_x1": 65.056, "r_y1": 453.372, "r_x2": 65.056, "r_y2": 444.82, "r_x3": 61.569, "r_y3": 444.82, "coord_origin": "TOPLEFT"}, "text": "\u2022", "orig": "\u2022", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.037, "r_y0": 453.372, "r_x1": 117.101, "r_y1": 453.372, "r_x2": 117.101, "r_y2": 444.82, "r_x3": 70.037, "r_y3": 444.82, "coord_origin": "TOPLEFT"}, "text": "We propose", "orig": "We propose", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 48, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 119.59, "r_y0": 453.388, "r_x1": 175.42, "r_y1": 453.388, "r_x2": 175.42, "r_y2": 444.432, "r_x3": 119.59, "r_y3": 444.432, "coord_origin": "TOPLEFT"}, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 49, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 175.421, "r_y0": 453.372, "r_x1": 286.365, "r_y1": 453.372, "r_x2": 286.365, "r_y2": 444.82, "r_x3": 175.421, "r_y3": 444.82, "coord_origin": "TOPLEFT"}, "text": ", a transformer based model", "orig": ", a transformer based model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 50, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.037, "r_y0": 465.327, "r_x1": 286.365, "r_y1": 465.327, "r_x2": 286.365, "r_y2": 456.775, "r_x3": 70.037, "r_y3": 456.775, "coord_origin": "TOPLEFT"}, "text": "that predicts tables structure and bounding boxes for", "orig": "that predicts tables structure and bounding boxes for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 51, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.037, "r_y0": 477.282, "r_x1": 286.365, "r_y1": 477.282, "r_x2": 286.365, "r_y2": 468.73, "r_x3": 70.037, "r_y3": 468.73, "coord_origin": "TOPLEFT"}, "text": "the table content simultaneously in an end-to-end ap-", "orig": "the table content simultaneously in an end-to-end ap-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 52, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.037, "r_y0": 489.237, "r_x1": 99.636, "r_y1": 489.237, "r_x2": 99.636, "r_y2": 480.685, "r_x3": 70.037, "r_y3": 480.685, "coord_origin": "TOPLEFT"}, "text": "proach.", "orig": "proach.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "\u00b7 We propose TableFormer , a transformer based model that predicts tables structure and bounding boxes for the table content simultaneously in an end-to-end approach."}, {"label": "list_item", "id": 5, "page_no": 1, "cluster": {"id": 5, "label": "list_item", "bbox": {"l": 61.569, "t": 502.034, "r": 286.365, "b": 546.84, "coord_origin": "TOPLEFT"}, "confidence": 0.982271671295166, "cells": [{"index": 53, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 61.569, "r_y0": 510.974, "r_x1": 65.056, "r_y1": 510.974, "r_x2": 65.056, "r_y2": 502.422, "r_x3": 61.569, "r_y3": 502.422, "coord_origin": "TOPLEFT"}, "text": "\u2022", "orig": "\u2022", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 54, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.037, "r_y0": 510.974, "r_x1": 111.88, "r_y1": 510.974, "r_x2": 111.88, "r_y2": 502.422, "r_x3": 70.037, "r_y3": 502.422, "coord_origin": "TOPLEFT"}, "text": "Across all", "orig": "Across all", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 55, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 116.084, "r_y0": 510.974, "r_x1": 196.104, "r_y1": 510.974, "r_x2": 196.104, "r_y2": 502.422, "r_x3": 116.084, "r_y3": 502.422, "coord_origin": "TOPLEFT"}, "text": "benchmark datasets", "orig": "benchmark datasets", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 56, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 200.31, "r_y0": 510.99, "r_x1": 256.14, "r_y1": 510.99, "r_x2": 256.14, "r_y2": 502.034, "r_x3": 200.31, "r_y3": 502.034, "coord_origin": "TOPLEFT"}, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 57, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 260.35, "r_y0": 510.974, "r_x1": 286.362, "r_y1": 510.974, "r_x2": 286.362, "r_y2": 502.422, "r_x3": 260.35, "r_y3": 502.422, "coord_origin": "TOPLEFT"}, "text": "signif-", "orig": "signif-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 58, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.037, "r_y0": 522.929, "r_x1": 97.155, "r_y1": 522.929, "r_x2": 97.155, "r_y2": 514.377, "r_x3": 70.037, "r_y3": 514.377, "coord_origin": "TOPLEFT"}, "text": "icantly", "orig": "icantly", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 59, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 101.678, "r_y0": 522.929, "r_x1": 150.375, "r_y1": 522.929, "r_x2": 150.375, "r_y2": 514.377, "r_x3": 101.678, "r_y3": 514.377, "coord_origin": "TOPLEFT"}, "text": "outperforms", "orig": "outperforms", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 60, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 154.898, "r_y0": 522.929, "r_x1": 186.301, "r_y1": 522.929, "r_x2": 186.301, "r_y2": 514.377, "r_x3": 154.898, "r_y3": 514.377, "coord_origin": "TOPLEFT"}, "text": "existing", "orig": "existing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 61, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 190.824, "r_y0": 522.929, "r_x1": 250.021, "r_y1": 522.929, "r_x2": 250.021, "r_y2": 514.377, "r_x3": 190.824, "r_y3": 514.377, "coord_origin": "TOPLEFT"}, "text": "state-of-the-art", "orig": "state-of-the-art", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 62, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 254.544, "r_y0": 522.929, "r_x1": 286.365, "r_y1": 522.929, "r_x2": 286.365, "r_y2": 514.377, "r_x3": 254.544, "r_y3": 514.377, "coord_origin": "TOPLEFT"}, "text": "metrics,", "orig": "metrics,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 63, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.037, "r_y0": 534.885, "r_x1": 286.365, "r_y1": 534.885, "r_x2": 286.365, "r_y2": 526.3330000000001, "r_x3": 70.037, "r_y3": 526.3330000000001, "coord_origin": "TOPLEFT"}, "text": "while being much more efficient in training and infer-", "orig": "while being much more efficient in training and infer-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 64, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.037, "r_y0": 546.84, "r_x1": 161.653, "r_y1": 546.84, "r_x2": 161.653, "r_y2": 538.288, "r_x3": 70.037, "r_y3": 538.288, "coord_origin": "TOPLEFT"}, "text": "ence to existing works.", "orig": "ence to existing works.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "\u00b7 Across all benchmark datasets TableFormer significantly outperforms existing state-of-the-art metrics, while being much more efficient in training and inference to existing works."}, {"label": "list_item", "id": 9, "page_no": 1, "cluster": {"id": 9, "label": "list_item", "bbox": {"l": 61.569, "t": 559.637, "r": 286.365, "b": 592.487, "coord_origin": "TOPLEFT"}, "confidence": 0.9802963733673096, "cells": [{"index": 65, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 61.569, "r_y0": 568.577, "r_x1": 65.056, "r_y1": 568.577, "r_x2": 65.056, "r_y2": 560.025, "r_x3": 61.569, "r_y3": 560.025, "coord_origin": "TOPLEFT"}, "text": "\u2022", "orig": "\u2022", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 66, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.037, "r_y0": 568.577, "r_x1": 116.712, "r_y1": 568.577, "r_x2": 116.712, "r_y2": 560.025, "r_x3": 70.037, "r_y3": 560.025, "coord_origin": "TOPLEFT"}, "text": "We present", "orig": "We present", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 67, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 121.583, "r_y0": 568.593, "r_x1": 177.682, "r_y1": 568.593, "r_x2": 177.682, "r_y2": 559.637, "r_x3": 121.583, "r_y3": 559.637, "coord_origin": "TOPLEFT"}, "text": "SynthTabNet", "orig": "SynthTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 68, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 182.553, "r_y0": 568.577, "r_x1": 186.976, "r_y1": 568.577, "r_x2": 186.976, "r_y2": 560.025, "r_x3": 182.553, "r_y3": 560.025, "coord_origin": "TOPLEFT"}, "text": "a", "orig": "a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 69, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 191.848, "r_y0": 568.577, "r_x1": 242.767, "r_y1": 568.577, "r_x2": 242.767, "r_y2": 560.025, "r_x3": 191.848, "r_y3": 560.025, "coord_origin": "TOPLEFT"}, "text": "synthetically", "orig": "synthetically", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 70, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 247.639, "r_y0": 568.577, "r_x1": 286.363, "r_y1": 568.577, "r_x2": 286.363, "r_y2": 560.025, "r_x3": 247.639, "r_y3": 560.025, "coord_origin": "TOPLEFT"}, "text": "generated", "orig": "generated", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 71, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.037, "r_y0": 580.532, "r_x1": 286.365, "r_y1": 580.532, "r_x2": 286.365, "r_y2": 571.98, "r_x3": 70.037, "r_y3": 571.98, "coord_origin": "TOPLEFT"}, "text": "dataset, with various appearance styles and complex-", "orig": "dataset, with various appearance styles and complex-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 72, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.037, "r_y0": 592.487, "r_x1": 82.401, "r_y1": 592.487, "r_x2": 82.401, "r_y2": 583.935, "r_x3": 70.037, "r_y3": 583.935, "coord_origin": "TOPLEFT"}, "text": "ity.", "orig": "ity.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "\u00b7 We present SynthTabNet a synthetically generated dataset, with various appearance styles and complexity."}, {"label": "list_item", "id": 8, "page_no": 1, "cluster": {"id": 8, "label": "list_item", "bbox": {"l": 61.569, "t": 605.672, "r": 286.365, "b": 638.135, "coord_origin": "TOPLEFT"}, "confidence": 0.9806395173072815, "cells": [{"index": 73, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 61.569, "r_y0": 614.2239999999999, "r_x1": 65.056, "r_y1": 614.2239999999999, "r_x2": 65.056, "r_y2": 605.672, "r_x3": 61.569, "r_y3": 605.672, "coord_origin": "TOPLEFT"}, "text": "\u2022", "orig": "\u2022", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 74, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.037, "r_y0": 614.2239999999999, "r_x1": 132.005, "r_y1": 614.2239999999999, "r_x2": 132.005, "r_y2": 605.672, "r_x3": 70.037, "r_y3": 605.672, "coord_origin": "TOPLEFT"}, "text": "An augmented", "orig": "An augmented", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 75, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 138.082, "r_y0": 614.2239999999999, "r_x1": 165.748, "r_y1": 614.2239999999999, "r_x2": 165.748, "r_y2": 605.672, "r_x3": 138.082, "r_y3": 605.672, "coord_origin": "TOPLEFT"}, "text": "dataset", "orig": "dataset", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 76, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 171.815, "r_y0": 614.2239999999999, "r_x1": 194.5, "r_y1": 614.2239999999999, "r_x2": 194.5, "r_y2": 605.672, "r_x3": 171.815, "r_y3": 605.672, "coord_origin": "TOPLEFT"}, "text": "based", "orig": "based", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 77, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 200.577, "r_y0": 614.2239999999999, "r_x1": 210.54, "r_y1": 614.2239999999999, "r_x2": 210.54, "r_y2": 605.672, "r_x3": 200.577, "r_y3": 605.672, "coord_origin": "TOPLEFT"}, "text": "on", "orig": "on", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 78, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 216.617, "r_y0": 614.2239999999999, "r_x1": 261.2, "r_y1": 614.2239999999999, "r_x2": 261.2, "r_y2": 605.672, "r_x3": 216.617, "r_y3": 605.672, "coord_origin": "TOPLEFT"}, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 79, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 267.277, "r_y0": 614.2239999999999, "r_x1": 286.365, "r_y1": 614.2239999999999, "r_x2": 286.365, "r_y2": 605.672, "r_x3": 267.277, "r_y3": 605.672, "coord_origin": "TOPLEFT"}, "text": "[37],", "orig": "[37],", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 80, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.037, "r_y0": 626.179, "r_x1": 135.521, "r_y1": 626.179, "r_x2": 135.521, "r_y2": 617.627, "r_x3": 70.037, "r_y3": 617.627, "coord_origin": "TOPLEFT"}, "text": "FinTabNet [36],", "orig": "FinTabNet [36],", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 81, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 139.925, "r_y0": 626.179, "r_x1": 286.365, "r_y1": 626.179, "r_x2": 286.365, "r_y2": 617.627, "r_x3": 139.925, "r_y3": 617.627, "coord_origin": "TOPLEFT"}, "text": "and TableBank [17] with generated", "orig": "and TableBank [17] with generated", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 82, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.037, "r_y0": 638.135, "r_x1": 198.056, "r_y1": 638.135, "r_x2": 198.056, "r_y2": 629.583, "r_x3": 70.037, "r_y3": 629.583, "coord_origin": "TOPLEFT"}, "text": "ground-truth for reproducibility.", "orig": "ground-truth for reproducibility.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "\u00b7 An augmented dataset based on PubTabNet [37], FinTabNet [36], and TableBank [17] with generated ground-truth for reproducibility."}, {"label": "text", "id": 11, "page_no": 1, "cluster": {"id": 11, "label": "text", "bbox": {"l": 50.112, "t": 650.867, "r": 286.365, "b": 695.284, "coord_origin": "TOPLEFT"}, "confidence": 0.9742533564567566, "cells": [{"index": 83, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 659.419, "r_x1": 204.452, "r_y1": 659.419, "r_x2": 204.452, "r_y2": 650.867, "r_x3": 62.067, "r_y3": 650.867, "coord_origin": "TOPLEFT"}, "text": "The paper is structured as follows.", "orig": "The paper is structured as follows.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 84, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 210.789, "r_y0": 659.419, "r_x1": 286.365, "r_y1": 659.419, "r_x2": 286.365, "r_y2": 650.867, "r_x3": 210.789, "r_y3": 650.867, "coord_origin": "TOPLEFT"}, "text": "In Sec. 2, we give", "orig": "In Sec. 2, we give", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 85, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 671.374, "r_x1": 240.896, "r_y1": 671.374, "r_x2": 240.896, "r_y2": 662.822, "r_x3": 50.112, "r_y3": 662.822, "coord_origin": "TOPLEFT"}, "text": "a brief overview of the current state-of-the-art.", "orig": "a brief overview of the current state-of-the-art.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 86, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 246.833, "r_y0": 671.374, "r_x1": 286.365, "r_y1": 671.374, "r_x2": 286.365, "r_y2": 662.822, "r_x3": 246.833, "r_y3": 662.822, "coord_origin": "TOPLEFT"}, "text": "In Sec. 3,", "orig": "In Sec. 3,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 87, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 683.329, "r_x1": 227.396, "r_y1": 683.329, "r_x2": 227.396, "r_y2": 674.777, "r_x3": 50.112, "r_y3": 674.777, "coord_origin": "TOPLEFT"}, "text": "we describe the datasets on which we train.", "orig": "we describe the datasets on which we train.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 88, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 232.467, "r_y0": 683.329, "r_x1": 286.365, "r_y1": 683.329, "r_x2": 286.365, "r_y2": 674.777, "r_x3": 232.467, "r_y3": 674.777, "coord_origin": "TOPLEFT"}, "text": "In Sec. 4, we", "orig": "In Sec. 4, we", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 89, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 695.284, "r_x1": 286.365, "r_y1": 695.284, "r_x2": 286.365, "r_y2": 686.732, "r_x3": 50.112, "r_y3": 686.732, "coord_origin": "TOPLEFT"}, "text": "introduce the TableFormer model-architecture and describe", "orig": "introduce the TableFormer model-architecture and describe", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "The paper is structured as follows. In Sec. 2, we give a brief overview of the current state-of-the-art. In Sec. 3, we describe the datasets on which we train. In Sec. 4, we introduce the TableFormer model-architecture and describe"}, {"label": "footnote", "id": 14, "page_no": 1, "cluster": {"id": 14, "label": "footnote", "bbox": {"l": 60.971, "t": 704.296, "r": 183.731, "b": 712.653, "coord_origin": "TOPLEFT"}, "confidence": 0.895367443561554, "cells": [{"index": 90, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 60.971, "r_y0": 709.427, "r_x1": 63.96, "r_y1": 709.427, "r_x2": 63.96, "r_y2": 704.296, "r_x3": 60.971, "r_y3": 704.296, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 91, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 64.458, "r_y0": 712.653, "r_x1": 183.731, "r_y1": 712.653, "r_x2": 183.731, "r_y2": 705.811, "r_x3": 64.458, "r_y3": 705.811, "coord_origin": "TOPLEFT"}, "text": "https://github.com/IBM/SynthTabNet", "orig": "https://github.com/IBM/SynthTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "1 https://github.com/IBM/SynthTabNet"}, {"label": "text", "id": 10, "page_no": 1, "cluster": {"id": 10, "label": "text", "bbox": {"l": 308.862, "t": 75.47699999999998, "r": 545.115, "b": 107.93899999999996, "coord_origin": "TOPLEFT"}, "confidence": 0.9774322509765625, "cells": [{"index": 92, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 84.029, "r_x1": 545.115, "r_y1": 84.029, "r_x2": 545.115, "r_y2": 75.47699999999998, "r_x3": 308.862, "r_y3": 75.47699999999998, "coord_origin": "TOPLEFT"}, "text": "its results &performance in Sec. 5. As a conclusion, we de-", "orig": "its results &performance in Sec. 5. As a conclusion, we de-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 93, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 95.98400000000004, "r_x1": 545.115, "r_y1": 95.98400000000004, "r_x2": 545.115, "r_y2": 87.43200000000002, "r_x3": 308.862, "r_y3": 87.43200000000002, "coord_origin": "TOPLEFT"}, "text": "scribe how this new model-architecture can be re-purposed", "orig": "scribe how this new model-architecture can be re-purposed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 94, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 107.93899999999996, "r_x1": 508.084, "r_y1": 107.93899999999996, "r_x2": 508.084, "r_y2": 99.38699999999994, "r_x3": 308.862, "r_y3": 99.38699999999994, "coord_origin": "TOPLEFT"}, "text": "for other tasks in the computer-vision community.", "orig": "for other tasks in the computer-vision community.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "its results &performance in Sec. 5. As a conclusion, we describe how this new model-architecture can be re-purposed for other tasks in the computer-vision community."}, {"label": "section_header", "id": 13, "page_no": 1, "cluster": {"id": 13, "label": "section_header", "bbox": {"l": 308.862, "t": 121.73199999999997, "r": 498.28, "b": 132.48000000000002, "coord_origin": "TOPLEFT"}, "confidence": 0.9428724646568298, "cells": [{"index": 95, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 132.48000000000002, "r_x1": 498.28, "r_y1": 132.48000000000002, "r_x2": 498.28, "r_y2": 121.73199999999997, "r_x3": 308.862, "r_y3": 121.73199999999997, "coord_origin": "TOPLEFT"}, "text": "2. Previous work and State of the Art", "orig": "2. Previous work and State of the Art", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "2. Previous work and State of the Art"}, {"label": "text", "id": 0, "page_no": 1, "cluster": {"id": 0, "label": "text", "bbox": {"l": 308.862, "t": 142.49, "r": 545.115, "b": 330.369, "coord_origin": "TOPLEFT"}, "confidence": 0.987194836139679, "cells": [{"index": 96, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 151.04200000000003, "r_x1": 545.115, "r_y1": 151.04200000000003, "r_x2": 545.115, "r_y2": 142.49, "r_x3": 320.817, "r_y3": 142.49, "coord_origin": "TOPLEFT"}, "text": "Identifying the structure of a table has been an outstand-", "orig": "Identifying the structure of a table has been an outstand-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 97, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 162.99699999999996, "r_x1": 545.115, "r_y1": 162.99699999999996, "r_x2": 545.115, "r_y2": 154.44500000000005, "r_x3": 308.862, "r_y3": 154.44500000000005, "coord_origin": "TOPLEFT"}, "text": "ing problem in the document-parsing community, that mo-", "orig": "ing problem in the document-parsing community, that mo-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 98, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 174.952, "r_x1": 334.376, "r_y1": 174.952, "r_x2": 334.376, "r_y2": 166.39999999999998, "r_x3": 308.862, "r_y3": 166.39999999999998, "coord_origin": "TOPLEFT"}, "text": "tivates", "orig": "tivates", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 99, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 338.192, "r_y0": 174.952, "r_x1": 522.56, "r_y1": 174.952, "r_x2": 522.56, "r_y2": 166.39999999999998, "r_x3": 338.192, "r_y3": 166.39999999999998, "coord_origin": "TOPLEFT"}, "text": "many organised public challenges [6, 4, 14].", "orig": "many organised public challenges [6, 4, 14].", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 100, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 529.623, "r_y0": 174.952, "r_x1": 545.115, "r_y1": 174.952, "r_x2": 545.115, "r_y2": 166.39999999999998, "r_x3": 529.623, "r_y3": 166.39999999999998, "coord_origin": "TOPLEFT"}, "text": "The", "orig": "The", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 101, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 186.90700000000004, "r_x1": 545.115, "r_y1": 186.90700000000004, "r_x2": 545.115, "r_y2": 178.35500000000002, "r_x3": 308.862, "r_y3": 178.35500000000002, "coord_origin": "TOPLEFT"}, "text": "difficulty of the problem can be attributed to a number of", "orig": "difficulty of the problem can be attributed to a number of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 102, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 198.86199999999997, "r_x1": 545.115, "r_y1": 198.86199999999997, "r_x2": 545.115, "r_y2": 190.30999999999995, "r_x3": 308.862, "r_y3": 190.30999999999995, "coord_origin": "TOPLEFT"}, "text": "factors. First, there is a large variety in the shapes and sizes", "orig": "factors. First, there is a large variety in the shapes and sizes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 103, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 210.817, "r_x1": 346.979, "r_y1": 210.817, "r_x2": 346.979, "r_y2": 202.265, "r_x3": 308.862, "r_y3": 202.265, "coord_origin": "TOPLEFT"}, "text": "of tables.", "orig": "of tables.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 104, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 354.869, "r_y0": 210.817, "r_x1": 508.642, "r_y1": 210.817, "r_x2": 508.642, "r_y2": 202.265, "r_x3": 354.869, "r_y3": 202.265, "coord_origin": "TOPLEFT"}, "text": "Such large variety requires a flexible", "orig": "Such large variety requires a flexible", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 105, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 512.737, "r_y0": 210.817, "r_x1": 545.115, "r_y1": 210.817, "r_x2": 545.115, "r_y2": 202.265, "r_x3": 512.737, "r_y3": 202.265, "coord_origin": "TOPLEFT"}, "text": "method.", "orig": "method.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 106, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 222.77300000000002, "r_x1": 545.115, "r_y1": 222.77300000000002, "r_x2": 545.115, "r_y2": 214.221, "r_x3": 308.862, "r_y3": 214.221, "coord_origin": "TOPLEFT"}, "text": "This is especially true for complex column- and row head-", "orig": "This is especially true for complex column- and row head-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 107, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 234.72799999999995, "r_x1": 322.969, "r_y1": 234.72799999999995, "r_x2": 322.969, "r_y2": 226.17600000000004, "r_x3": 308.862, "r_y3": 226.17600000000004, "coord_origin": "TOPLEFT"}, "text": "ers,", "orig": "ers,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 108, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 327.084, "r_y0": 234.72799999999995, "r_x1": 530.918, "r_y1": 234.72799999999995, "r_x2": 530.918, "r_y2": 226.17600000000004, "r_x3": 327.084, "r_y3": 226.17600000000004, "coord_origin": "TOPLEFT"}, "text": "which can be extremely intricate and demanding.", "orig": "which can be extremely intricate and demanding.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 109, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 537.922, "r_y0": 234.72799999999995, "r_x1": 545.115, "r_y1": 234.72799999999995, "r_x2": 545.115, "r_y2": 226.17600000000004, "r_x3": 537.922, "r_y3": 226.17600000000004, "coord_origin": "TOPLEFT"}, "text": "A", "orig": "A", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 110, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 246.683, "r_x1": 545.115, "r_y1": 246.683, "r_x2": 545.115, "r_y2": 238.13099999999997, "r_x3": 308.862, "r_y3": 238.13099999999997, "coord_origin": "TOPLEFT"}, "text": "second factor of complexity is the lack of data with regard", "orig": "second factor of complexity is the lack of data with regard", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 111, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 258.63800000000003, "r_x1": 545.115, "r_y1": 258.63800000000003, "r_x2": 545.115, "r_y2": 250.086, "r_x3": 308.862, "r_y3": 250.086, "coord_origin": "TOPLEFT"}, "text": "to table-structure. Until the publication of PubTabNet [37],", "orig": "to table-structure. Until the publication of PubTabNet [37],", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 112, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 270.59299999999996, "r_x1": 439.84, "r_y1": 270.59299999999996, "r_x2": 439.84, "r_y2": 262.04100000000005, "r_x3": 308.862, "r_y3": 262.04100000000005, "coord_origin": "TOPLEFT"}, "text": "there were no large datasets (i.e.", "orig": "there were no large datasets (i.e.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 113, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 444.44, "r_y0": 270.429, "r_x1": 452.189, "r_y1": 270.429, "r_x2": 452.189, "r_y2": 261.72299999999996, "r_x3": 444.44, "r_y3": 261.72299999999996, "coord_origin": "TOPLEFT"}, "text": ">", "orig": ">", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 114, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 455.89, "r_y0": 270.429, "r_x1": 470.834, "r_y1": 270.429, "r_x2": 470.834, "r_y2": 261.72299999999996, "r_x3": 455.89, "r_y3": 261.72299999999996, "coord_origin": "TOPLEFT"}, "text": "100", "orig": "100", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 115, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 470.834, "r_y0": 270.59299999999996, "r_x1": 545.115, "r_y1": 270.59299999999996, "r_x2": 545.115, "r_y2": 262.04100000000005, "r_x3": 470.834, "r_y3": 262.04100000000005, "coord_origin": "TOPLEFT"}, "text": "K tables) that pro-", "orig": "K tables) that pro-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 116, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 282.548, "r_x1": 545.115, "r_y1": 282.548, "r_x2": 545.115, "r_y2": 273.996, "r_x3": 308.862, "r_y3": 273.996, "coord_origin": "TOPLEFT"}, "text": "vided structure information. This happens primarily due to", "orig": "vided structure information. This happens primarily due to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 117, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 294.504, "r_x1": 545.115, "r_y1": 294.504, "r_x2": 545.115, "r_y2": 285.952, "r_x3": 308.862, "r_y3": 285.952, "coord_origin": "TOPLEFT"}, "text": "the fact that tables are notoriously time-consuming to an-", "orig": "the fact that tables are notoriously time-consuming to an-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 118, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 306.459, "r_x1": 545.115, "r_y1": 306.459, "r_x2": 545.115, "r_y2": 297.907, "r_x3": 308.862, "r_y3": 297.907, "coord_origin": "TOPLEFT"}, "text": "notate by hand. However, this has definitely changed in re-", "orig": "notate by hand. However, this has definitely changed in re-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 119, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 318.414, "r_x1": 545.115, "r_y1": 318.414, "r_x2": 545.115, "r_y2": 309.862, "r_x3": 308.862, "r_y3": 309.862, "coord_origin": "TOPLEFT"}, "text": "cent years with the deliverance of PubTabNet [37], FinTab-", "orig": "cent years with the deliverance of PubTabNet [37], FinTab-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 120, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 330.369, "r_x1": 425.923, "r_y1": 330.369, "r_x2": 425.923, "r_y2": 321.817, "r_x3": 308.862, "r_y3": 321.817, "coord_origin": "TOPLEFT"}, "text": "Net [36], TableBank [17] etc.", "orig": "Net [36], TableBank [17] etc.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Identifying the structure of a table has been an outstanding problem in the document-parsing community, that motivates many organised public challenges [6, 4, 14]. The difficulty of the problem can be attributed to a number of factors. First, there is a large variety in the shapes and sizes of tables. Such large variety requires a flexible method. This is especially true for complex column- and row headers, which can be extremely intricate and demanding. A second factor of complexity is the lack of data with regard to table-structure. Until the publication of PubTabNet [37], there were no large datasets (i.e. > 100 K tables) that provided structure information. This happens primarily due to the fact that tables are notoriously time-consuming to annotate by hand. However, this has definitely changed in recent years with the deliverance of PubTabNet [37], FinTabNet [36], TableBank [17] etc."}, {"label": "text", "id": 1, "page_no": 1, "cluster": {"id": 1, "label": "text", "bbox": {"l": 308.862, "t": 333.838, "r": 545.115, "b": 449.987, "coord_origin": "TOPLEFT"}, "confidence": 0.9869040250778198, "cells": [{"index": 121, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 342.39, "r_x1": 391.492, "r_y1": 342.39, "r_x2": 391.492, "r_y2": 333.838, "r_x3": 320.817, "r_y3": 333.838, "coord_origin": "TOPLEFT"}, "text": "Before the rising", "orig": "Before the rising", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 122, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 395.845, "r_y0": 342.39, "r_x1": 436.802, "r_y1": 342.39, "r_x2": 436.802, "r_y2": 333.838, "r_x3": 395.845, "r_y3": 333.838, "coord_origin": "TOPLEFT"}, "text": "popularity", "orig": "popularity", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 123, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 441.145, "r_y0": 342.39, "r_x1": 449.444, "r_y1": 342.39, "r_x2": 449.444, "r_y2": 333.838, "r_x3": 441.145, "r_y3": 333.838, "coord_origin": "TOPLEFT"}, "text": "of", "orig": "of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 124, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 453.798, "r_y0": 342.39, "r_x1": 545.115, "r_y1": 342.39, "r_x2": 545.115, "r_y2": 333.838, "r_x3": 453.798, "r_y3": 333.838, "coord_origin": "TOPLEFT"}, "text": "deep neural networks,", "orig": "deep neural networks,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 125, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 354.345, "r_x1": 545.115, "r_y1": 354.345, "r_x2": 545.115, "r_y2": 345.793, "r_x3": 308.862, "r_y3": 345.793, "coord_origin": "TOPLEFT"}, "text": "the community relied heavily on heuristic and/or statistical", "orig": "the community relied heavily on heuristic and/or statistical", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 126, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 366.3, "r_x1": 545.115, "r_y1": 366.3, "r_x2": 545.115, "r_y2": 357.748, "r_x3": 308.862, "r_y3": 357.748, "coord_origin": "TOPLEFT"}, "text": "methods to do table structure identification [3, 7, 11, 5, 13,", "orig": "methods to do table structure identification [3, 7, 11, 5, 13,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 127, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 378.256, "r_x1": 324.633, "r_y1": 378.256, "r_x2": 324.633, "r_y2": 369.704, "r_x3": 308.862, "r_y3": 369.704, "coord_origin": "TOPLEFT"}, "text": "28].", "orig": "28].", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 128, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 329.634, "r_y0": 378.256, "r_x1": 545.115, "r_y1": 378.256, "r_x2": 545.115, "r_y2": 369.704, "r_x3": 329.634, "r_y3": 369.704, "coord_origin": "TOPLEFT"}, "text": "Although such methods work well on constrained ta-", "orig": "Although such methods work well on constrained ta-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 129, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 390.211, "r_x1": 545.115, "r_y1": 390.211, "r_x2": 545.115, "r_y2": 381.659, "r_x3": 308.862, "r_y3": 381.659, "coord_origin": "TOPLEFT"}, "text": "bles [12], a more data-driven approach can be applied due", "orig": "bles [12], a more data-driven approach can be applied due", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 130, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 402.166, "r_x1": 545.115, "r_y1": 402.166, "r_x2": 545.115, "r_y2": 393.614, "r_x3": 308.862, "r_y3": 393.614, "coord_origin": "TOPLEFT"}, "text": "to the advent of convolutional neural networks (CNNs) and", "orig": "to the advent of convolutional neural networks (CNNs) and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 131, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 414.121, "r_x1": 438.416, "r_y1": 414.121, "r_x2": 438.416, "r_y2": 405.569, "r_x3": 308.862, "r_y3": 405.569, "coord_origin": "TOPLEFT"}, "text": "the availability of large datasets.", "orig": "the availability of large datasets.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 132, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 442.231, "r_y0": 414.121, "r_x1": 545.115, "r_y1": 414.121, "r_x2": 545.115, "r_y2": 405.569, "r_x3": 442.231, "r_y3": 405.569, "coord_origin": "TOPLEFT"}, "text": "To the best-of-our knowl-", "orig": "To the best-of-our knowl-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 133, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 426.076, "r_x1": 545.115, "r_y1": 426.076, "r_x2": 545.115, "r_y2": 417.524, "r_x3": 308.862, "r_y3": 417.524, "coord_origin": "TOPLEFT"}, "text": "edge, there are currently two different types of network ar-", "orig": "edge, there are currently two different types of network ar-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 134, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 438.032, "r_x1": 545.115, "r_y1": 438.032, "r_x2": 545.115, "r_y2": 429.48, "r_x3": 308.862, "r_y3": 429.48, "coord_origin": "TOPLEFT"}, "text": "chitecture that are being pursued for state-of-the-art table-", "orig": "chitecture that are being pursued for state-of-the-art table-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 135, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 449.987, "r_x1": 401.285, "r_y1": 449.987, "r_x2": 401.285, "r_y2": 441.435, "r_x3": 308.862, "r_y3": 441.435, "coord_origin": "TOPLEFT"}, "text": "structure identification.", "orig": "structure identification.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Before the rising popularity of deep neural networks, the community relied heavily on heuristic and/or statistical methods to do table structure identification [3, 7, 11, 5, 13, 28]. Although such methods work well on constrained tables [12], a more data-driven approach can be applied due to the advent of convolutional neural networks (CNNs) and the availability of large datasets. To the best-of-our knowledge, there are currently two different types of network architecture that are being pursued for state-of-the-art tablestructure identification."}, {"label": "text", "id": 3, "page_no": 1, "cluster": {"id": 3, "label": "text", "bbox": {"l": 308.862, "t": 453.068, "r": 545.117, "b": 713.066, "coord_origin": "TOPLEFT"}, "confidence": 0.9843218326568604, "cells": [{"index": 136, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 462.024, "r_x1": 423.262, "r_y1": 462.024, "r_x2": 423.262, "r_y2": 453.068, "r_x3": 320.817, "r_y3": 453.068, "coord_origin": "TOPLEFT"}, "text": "Image-to-Text networks", "orig": "Image-to-Text networks", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 137, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 423.267, "r_y0": 462.008, "r_x1": 426.037, "r_y1": 462.008, "r_x2": 426.037, "r_y2": 453.456, "r_x3": 423.267, "r_y3": 453.456, "coord_origin": "TOPLEFT"}, "text": ":", "orig": ":", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 138, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 430.769, "r_y0": 462.008, "r_x1": 545.11, "r_y1": 462.008, "r_x2": 545.11, "r_y2": 453.456, "r_x3": 430.769, "r_y3": 453.456, "coord_origin": "TOPLEFT"}, "text": "In this type of network, one", "orig": "In this type of network, one", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 139, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 473.963, "r_x1": 340.404, "r_y1": 473.963, "r_x2": 340.404, "r_y2": 465.411, "r_x3": 308.862, "r_y3": 465.411, "coord_origin": "TOPLEFT"}, "text": "predicts", "orig": "predicts", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 140, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 345.116, "r_y0": 473.963, "r_x1": 349.539, "r_y1": 473.963, "r_x2": 349.539, "r_y2": 465.411, "r_x3": 345.116, "r_y3": 465.411, "coord_origin": "TOPLEFT"}, "text": "a", "orig": "a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 141, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 354.252, "r_y0": 473.963, "r_x1": 390.765, "r_y1": 473.963, "r_x2": 390.765, "r_y2": 465.411, "r_x3": 354.252, "r_y3": 465.411, "coord_origin": "TOPLEFT"}, "text": "sequence", "orig": "sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 142, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 395.477, "r_y0": 473.963, "r_x1": 403.776, "r_y1": 473.963, "r_x2": 403.776, "r_y2": 465.411, "r_x3": 395.477, "r_y3": 465.411, "coord_origin": "TOPLEFT"}, "text": "of", "orig": "of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 143, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 408.488, "r_y0": 473.963, "r_x1": 434.401, "r_y1": 473.963, "r_x2": 434.401, "r_y2": 465.411, "r_x3": 408.488, "r_y3": 465.411, "coord_origin": "TOPLEFT"}, "text": "tokens", "orig": "tokens", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 144, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 439.113, "r_y0": 473.963, "r_x1": 469.001, "r_y1": 473.963, "r_x2": 469.001, "r_y2": 465.411, "r_x3": 439.113, "r_y3": 465.411, "coord_origin": "TOPLEFT"}, "text": "starting", "orig": "starting", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 145, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 473.713, "r_y0": 473.963, "r_x1": 545.115, "r_y1": 473.963, "r_x2": 545.115, "r_y2": 465.411, "r_x3": 473.713, "r_y3": 465.411, "coord_origin": "TOPLEFT"}, "text": "from an encoded", "orig": "from an encoded", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 146, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 485.918, "r_x1": 335.701, "r_y1": 485.918, "r_x2": 335.701, "r_y2": 477.366, "r_x3": 308.862, "r_y3": 477.366, "coord_origin": "TOPLEFT"}, "text": "image.", "orig": "image.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 147, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 345.853, "r_y0": 485.918, "r_x1": 411.009, "r_y1": 485.918, "r_x2": 411.009, "r_y2": 477.366, "r_x3": 345.853, "r_y3": 477.366, "coord_origin": "TOPLEFT"}, "text": "Such sequences", "orig": "Such sequences", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 148, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 415.85, "r_y0": 485.918, "r_x1": 424.149, "r_y1": 485.918, "r_x2": 424.149, "r_y2": 477.366, "r_x3": 415.85, "r_y3": 477.366, "coord_origin": "TOPLEFT"}, "text": "of", "orig": "of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 149, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 429.001, "r_y0": 485.918, "r_x1": 454.914, "r_y1": 485.918, "r_x2": 454.914, "r_y2": 477.366, "r_x3": 429.001, "r_y3": 477.366, "coord_origin": "TOPLEFT"}, "text": "tokens", "orig": "tokens", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 150, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 459.756, "r_y0": 485.918, "r_x1": 473.584, "r_y1": 485.918, "r_x2": 473.584, "r_y2": 477.366, "r_x3": 459.756, "r_y3": 477.366, "coord_origin": "TOPLEFT"}, "text": "can", "orig": "can", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 151, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 478.425, "r_y0": 485.918, "r_x1": 487.83, "r_y1": 485.918, "r_x2": 487.83, "r_y2": 477.366, "r_x3": 478.425, "r_y3": 477.366, "coord_origin": "TOPLEFT"}, "text": "be", "orig": "be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 152, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 492.682, "r_y0": 485.918, "r_x1": 545.115, "r_y1": 485.918, "r_x2": 545.115, "r_y2": 477.366, "r_x3": 492.682, "r_y3": 477.366, "coord_origin": "TOPLEFT"}, "text": "HTML table", "orig": "HTML table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 153, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 497.873, "r_x1": 459.218, "r_y1": 497.873, "r_x2": 459.218, "r_y2": 489.321, "r_x3": 308.862, "r_y3": 489.321, "coord_origin": "TOPLEFT"}, "text": "tags [37, 17] or LaTeX symbols[10].", "orig": "tags [37, 17] or LaTeX symbols[10].", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 154, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 465.115, "r_y0": 497.873, "r_x1": 545.115, "r_y1": 497.873, "r_x2": 545.115, "r_y2": 489.321, "r_x3": 465.115, "r_y3": 489.321, "coord_origin": "TOPLEFT"}, "text": "The choice of sym-", "orig": "The choice of sym-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 155, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 509.828, "r_x1": 545.115, "r_y1": 509.828, "r_x2": 545.115, "r_y2": 501.276, "r_x3": 308.862, "r_y3": 501.276, "coord_origin": "TOPLEFT"}, "text": "bols is ultimately not very important, since one can be trans-", "orig": "bols is ultimately not very important, since one can be trans-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 156, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 521.784, "r_x1": 396.692, "r_y1": 521.784, "r_x2": 396.692, "r_y2": 513.232, "r_x3": 308.862, "r_y3": 513.232, "coord_origin": "TOPLEFT"}, "text": "formed into the other.", "orig": "formed into the other.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 157, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 401.265, "r_y0": 521.784, "r_x1": 545.115, "r_y1": 521.784, "r_x2": 545.115, "r_y2": 513.232, "r_x3": 401.265, "r_y3": 513.232, "coord_origin": "TOPLEFT"}, "text": "There are however subtle variations", "orig": "There are however subtle variations", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 158, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 533.739, "r_x1": 433.484, "r_y1": 533.739, "r_x2": 433.484, "r_y2": 525.187, "r_x3": 308.862, "r_y3": 525.187, "coord_origin": "TOPLEFT"}, "text": "in the Image-to-Text networks.", "orig": "in the Image-to-Text networks.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 159, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 438.187, "r_y0": 533.739, "r_x1": 545.115, "r_y1": 533.739, "r_x2": 545.115, "r_y2": 525.187, "r_x3": 438.187, "r_y3": 525.187, "coord_origin": "TOPLEFT"}, "text": "The easiest network archi-", "orig": "The easiest network archi-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 160, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 545.694, "r_x1": 420.941, "r_y1": 545.694, "r_x2": 420.941, "r_y2": 537.142, "r_x3": 308.862, "r_y3": 537.142, "coord_origin": "TOPLEFT"}, "text": "tectures are 'image-encoder", "orig": "tectures are 'image-encoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 161, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 423.595, "r_y0": 545.388, "r_x1": 433.558, "r_y1": 545.388, "r_x2": 433.558, "r_y2": 536.8240000000001, "r_x3": 423.595, "r_y3": 536.8240000000001, "coord_origin": "TOPLEFT"}, "text": "\u2192", "orig": "\u2192", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 162, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 436.212, "r_y0": 545.694, "r_x1": 545.113, "r_y1": 545.694, "r_x2": 545.113, "r_y2": 537.142, "r_x3": 436.212, "r_y3": 537.142, "coord_origin": "TOPLEFT"}, "text": "text-decoder' (IETD), sim-", "orig": "text-decoder' (IETD), sim-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 163, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 557.649, "r_x1": 545.115, "r_y1": 557.649, "r_x2": 545.115, "r_y2": 549.097, "r_x3": 308.862, "r_y3": 549.097, "coord_origin": "TOPLEFT"}, "text": "ilar to network architectures that try to provide captions to", "orig": "ilar to network architectures that try to provide captions to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 164, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 569.604, "r_x1": 545.115, "r_y1": 569.604, "r_x2": 545.115, "r_y2": 561.052, "r_x3": 308.862, "r_y3": 561.052, "coord_origin": "TOPLEFT"}, "text": "images [32]. In these IETD networks, one expects as output", "orig": "images [32]. In these IETD networks, one expects as output", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 165, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 581.559, "r_x1": 503.671, "r_y1": 581.559, "r_x2": 503.671, "r_y2": 573.0070000000001, "r_x3": 308.862, "r_y3": 573.0070000000001, "coord_origin": "TOPLEFT"}, "text": "the LaTeX/HTML string of the entire table, i.e.", "orig": "the LaTeX/HTML string of the entire table, i.e.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 166, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 509.579, "r_y0": 581.559, "r_x1": 545.115, "r_y1": 581.559, "r_x2": 545.115, "r_y2": 573.0070000000001, "r_x3": 509.579, "r_y3": 573.0070000000001, "coord_origin": "TOPLEFT"}, "text": "the sym-", "orig": "the sym-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 167, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 593.515, "r_x1": 545.115, "r_y1": 593.515, "r_x2": 545.115, "r_y2": 584.963, "r_x3": 308.862, "r_y3": 584.963, "coord_origin": "TOPLEFT"}, "text": "bols necessary for creating the table with the content of the", "orig": "bols necessary for creating the table with the content of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 168, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 605.47, "r_x1": 330.72, "r_y1": 605.47, "r_x2": 330.72, "r_y2": 596.918, "r_x3": 308.862, "r_y3": 596.918, "coord_origin": "TOPLEFT"}, "text": "table.", "orig": "table.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 169, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 334.536, "r_y0": 605.47, "r_x1": 497.075, "r_y1": 605.47, "r_x2": 497.075, "r_y2": 596.918, "r_x3": 334.536, "r_y3": 596.918, "coord_origin": "TOPLEFT"}, "text": "Another approach is the 'image-encoder", "orig": "Another approach is the 'image-encoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 170, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 499.805, "r_y0": 605.164, "r_x1": 509.768, "r_y1": 605.164, "r_x2": 509.768, "r_y2": 596.6, "r_x3": 499.805, "r_y3": 596.6, "coord_origin": "TOPLEFT"}, "text": "\u2192", "orig": "\u2192", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 171, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 512.501, "r_y0": 605.47, "r_x1": 545.109, "r_y1": 605.47, "r_x2": 545.109, "r_y2": 596.918, "r_x3": 512.501, "r_y3": 596.918, "coord_origin": "TOPLEFT"}, "text": "dual de-", "orig": "dual de-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 172, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 617.425, "r_x1": 545.115, "r_y1": 617.425, "r_x2": 545.115, "r_y2": 608.873, "r_x3": 308.862, "r_y3": 608.873, "coord_origin": "TOPLEFT"}, "text": "coder' (IEDD) networks. In these type of networks, one has", "orig": "coder' (IEDD) networks. In these type of networks, one has", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 173, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 629.38, "r_x1": 545.115, "r_y1": 629.38, "r_x2": 545.115, "r_y2": 620.828, "r_x3": 308.862, "r_y3": 620.828, "coord_origin": "TOPLEFT"}, "text": "two consecutive decoders with different purposes. The first", "orig": "two consecutive decoders with different purposes. The first", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 174, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 641.335, "r_x1": 364.782, "r_y1": 641.335, "r_x2": 364.782, "r_y2": 632.783, "r_x3": 308.862, "r_y3": 632.783, "coord_origin": "TOPLEFT"}, "text": "decoder is the", "orig": "decoder is the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 175, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 367.574, "r_y0": 641.192, "r_x1": 415.614, "r_y1": 641.192, "r_x2": 415.614, "r_y2": 632.604, "r_x3": 367.574, "r_y3": 632.604, "coord_origin": "TOPLEFT"}, "text": "tag-decoder", "orig": "tag-decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 176, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 415.613, "r_y0": 641.335, "r_x1": 418.104, "r_y1": 641.335, "r_x2": 418.104, "r_y2": 632.783, "r_x3": 415.613, "r_y3": 632.783, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 177, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 420.963, "r_y0": 641.335, "r_x1": 433.137, "r_y1": 641.335, "r_x2": 433.137, "r_y2": 632.783, "r_x3": 420.963, "r_y3": 632.783, "coord_origin": "TOPLEFT"}, "text": "i.e.", "orig": "i.e.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 178, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 437.122, "r_y0": 641.335, "r_x1": 442.661, "r_y1": 641.335, "r_x2": 442.661, "r_y2": 632.783, "r_x3": 437.122, "r_y3": 632.783, "coord_origin": "TOPLEFT"}, "text": "it", "orig": "it", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 179, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 445.441, "r_y0": 641.335, "r_x1": 545.117, "r_y1": 641.335, "r_x2": 545.117, "r_y2": 632.783, "r_x3": 445.441, "r_y3": 632.783, "coord_origin": "TOPLEFT"}, "text": "only produces the HTM-", "orig": "only produces the HTM-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 180, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 653.29, "r_x1": 545.115, "r_y1": 653.29, "r_x2": 545.115, "r_y2": 644.738, "r_x3": 308.862, "r_y3": 644.738, "coord_origin": "TOPLEFT"}, "text": "L/LaTeX tags which construct an empty table. The second", "orig": "L/LaTeX tags which construct an empty table. The second", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 181, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 665.103, "r_x1": 373.599, "r_y1": 665.103, "r_x2": 373.599, "r_y2": 656.515, "r_x3": 308.862, "r_y3": 656.515, "coord_origin": "TOPLEFT"}, "text": "content-decoder", "orig": "content-decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 182, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 376.907, "r_y0": 665.246, "r_x1": 545.116, "r_y1": 665.246, "r_x2": 545.116, "r_y2": 656.694, "r_x3": 376.907, "r_y3": 656.694, "coord_origin": "TOPLEFT"}, "text": "uses the encoding of the image in combi-", "orig": "uses the encoding of the image in combi-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 183, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 677.201, "r_x1": 545.115, "r_y1": 677.201, "r_x2": 545.115, "r_y2": 668.649, "r_x3": 308.862, "r_y3": 668.649, "coord_origin": "TOPLEFT"}, "text": "nation with the output encoding of each cell-tag (from the", "orig": "nation with the output encoding of each cell-tag (from the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 184, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 689.013, "r_x1": 356.902, "r_y1": 689.013, "r_x2": 356.902, "r_y2": 680.425, "r_x3": 308.862, "r_y3": 680.425, "coord_origin": "TOPLEFT"}, "text": "tag-decoder", "orig": "tag-decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 185, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 357.131, "r_y0": 689.156, "r_x1": 360.449, "r_y1": 689.156, "r_x2": 360.449, "r_y2": 680.604, "r_x3": 357.131, "r_y3": 680.604, "coord_origin": "TOPLEFT"}, "text": ")", "orig": ")", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 186, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 364.045, "r_y0": 689.156, "r_x1": 545.115, "r_y1": 689.156, "r_x2": 545.115, "r_y2": 680.604, "r_x3": 364.045, "r_y3": 680.604, "coord_origin": "TOPLEFT"}, "text": "to generate the textual content of each table", "orig": "to generate the textual content of each table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 187, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 701.111, "r_x1": 325.739, "r_y1": 701.111, "r_x2": 325.739, "r_y2": 692.559, "r_x3": 308.862, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "cell.", "orig": "cell.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 188, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 331.746, "r_y0": 701.111, "r_x1": 545.115, "r_y1": 701.111, "r_x2": 545.115, "r_y2": 692.559, "r_x3": 331.746, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "The network architecture of IEDD is certainly more", "orig": "The network architecture of IEDD is certainly more", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 189, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 713.066, "r_x1": 545.115, "r_y1": 713.066, "r_x2": 545.115, "r_y2": 704.514, "r_x3": 308.862, "r_y3": 704.514, "coord_origin": "TOPLEFT"}, "text": "elaborate, but it has the advantage that one can pre-train the", "orig": "elaborate, but it has the advantage that one can pre-train the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Image-to-Text networks : In this type of network, one predicts a sequence of tokens starting from an encoded image. Such sequences of tokens can be HTML table tags [37, 17] or LaTeX symbols[10]. The choice of symbols is ultimately not very important, since one can be transformed into the other. There are however subtle variations in the Image-to-Text networks. The easiest network architectures are 'image-encoder \u2192 text-decoder' (IETD), similar to network architectures that try to provide captions to images [32]. In these IETD networks, one expects as output the LaTeX/HTML string of the entire table, i.e. the symbols necessary for creating the table with the content of the table. Another approach is the 'image-encoder \u2192 dual decoder' (IEDD) networks. In these type of networks, one has two consecutive decoders with different purposes. The first decoder is the tag-decoder , i.e. it only produces the HTML/LaTeX tags which construct an empty table. The second content-decoder uses the encoding of the image in combination with the output encoding of each cell-tag (from the tag-decoder ) to generate the textual content of each table cell. The network architecture of IEDD is certainly more elaborate, but it has the advantage that one can pre-train the"}], "headers": [{"label": "page_footer", "id": 15, "page_no": 1, "cluster": {"id": 15, "label": "page_footer", "bbox": {"l": 295.121, "t": 734.402, "r": 300.102, "b": 742.954, "coord_origin": "TOPLEFT"}, "confidence": 0.8778094053268433, "cells": [{"index": 190, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 295.121, "r_y0": 742.954, "r_x1": 300.102, "r_y1": 742.954, "r_x2": 300.102, "r_y2": 734.402, "r_x3": 295.121, "r_y3": 734.402, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "2"}]}}, {"page_no": 2, "size": {"width": 612.0, "height": 792.0}, "cells": [{"index": 0, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 84.029, "r_x1": 250.151, "r_y1": 84.029, "r_x2": 250.151, "r_y2": 75.47699999999998, "r_x3": 50.112, "r_y3": 75.47699999999998, "coord_origin": "TOPLEFT"}, "text": "tag-decoder which is constrained to the table-tags.", "orig": "tag-decoder which is constrained to the table-tags.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 96.03999999999996, "r_x1": 70.366, "r_y1": 96.03999999999996, "r_x2": 70.366, "r_y2": 87.48800000000006, "r_x3": 62.067, "r_y3": 87.48800000000006, "coord_origin": "TOPLEFT"}, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 76.931, "r_y0": 96.03999999999996, "r_x1": 110.953, "r_y1": 96.03999999999996, "r_x2": 110.953, "r_y2": 87.48800000000006, "r_x3": 76.931, "r_y3": 87.48800000000006, "coord_origin": "TOPLEFT"}, "text": "practice,", "orig": "practice,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 118.545, "r_y0": 96.03999999999996, "r_x1": 136.258, "r_y1": 96.03999999999996, "r_x2": 136.258, "r_y2": 87.48800000000006, "r_x3": 118.545, "r_y3": 87.48800000000006, "coord_origin": "TOPLEFT"}, "text": "both", "orig": "both", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 142.824, "r_y0": 96.03999999999996, "r_x1": 175.372, "r_y1": 96.03999999999996, "r_x2": 175.372, "r_y2": 87.48800000000006, "r_x3": 142.824, "r_y3": 87.48800000000006, "coord_origin": "TOPLEFT"}, "text": "network", "orig": "network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 181.947, "r_y0": 96.03999999999996, "r_x1": 232.836, "r_y1": 96.03999999999996, "r_x2": 232.836, "r_y2": 87.48800000000006, "r_x3": 181.947, "r_y3": 87.48800000000006, "coord_origin": "TOPLEFT"}, "text": "architectures", "orig": "architectures", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 239.411, "r_y0": 96.03999999999996, "r_x1": 265.414, "r_y1": 96.03999999999996, "r_x2": 265.414, "r_y2": 87.48800000000006, "r_x3": 239.411, "r_y3": 87.48800000000006, "coord_origin": "TOPLEFT"}, "text": "(IETD", "orig": "(IETD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 271.979, "r_y0": 96.03999999999996, "r_x1": 286.365, "r_y1": 96.03999999999996, "r_x2": 286.365, "r_y2": 87.48800000000006, "r_x3": 271.979, "r_y3": 87.48800000000006, "coord_origin": "TOPLEFT"}, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 107.995, "r_x1": 286.365, "r_y1": 107.995, "r_x2": 286.365, "r_y2": 99.44299999999998, "r_x3": 50.112, "r_y3": 99.44299999999998, "coord_origin": "TOPLEFT"}, "text": "IEDD) require an implicit, custom trained object-character-", "orig": "IEDD) require an implicit, custom trained object-character-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 119.95100000000002, "r_x1": 286.365, "r_y1": 119.95100000000002, "r_x2": 286.365, "r_y2": 111.399, "r_x3": 50.112, "r_y3": 111.399, "coord_origin": "TOPLEFT"}, "text": "recognition (OCR) to obtain the content of the table-cells.", "orig": "recognition (OCR) to obtain the content of the table-cells.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 131.90599999999995, "r_x1": 286.365, "r_y1": 131.90599999999995, "r_x2": 286.365, "r_y2": 123.35400000000004, "r_x3": 50.112, "r_y3": 123.35400000000004, "coord_origin": "TOPLEFT"}, "text": "In the case of IETD, this OCR engine is implicit in the de-", "orig": "In the case of IETD, this OCR engine is implicit in the de-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 143.861, "r_x1": 286.365, "r_y1": 143.861, "r_x2": 286.365, "r_y2": 135.30899999999997, "r_x3": 50.112, "r_y3": 135.30899999999997, "coord_origin": "TOPLEFT"}, "text": "coder similar to [24]. For the IEDD, the OCR is solely em-", "orig": "coder similar to [24]. For the IEDD, the OCR is solely em-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 155.81600000000003, "r_x1": 174.206, "r_y1": 155.81600000000003, "r_x2": 174.206, "r_y2": 147.264, "r_x3": 50.112, "r_y3": 147.264, "coord_origin": "TOPLEFT"}, "text": "bedded in the content-decoder.", "orig": "bedded in the content-decoder.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 179.098, "r_y0": 155.81600000000003, "r_x1": 286.365, "r_y1": 155.81600000000003, "r_x2": 286.365, "r_y2": 147.264, "r_x3": 179.098, "r_y3": 147.264, "coord_origin": "TOPLEFT"}, "text": "This reliance on a custom,", "orig": "This reliance on a custom,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 167.77099999999996, "r_x1": 243.267, "r_y1": 167.77099999999996, "r_x2": 243.267, "r_y2": 159.21900000000005, "r_x3": 50.112, "r_y3": 159.21900000000005, "coord_origin": "TOPLEFT"}, "text": "implicit OCR decoder is of course problematic.", "orig": "implicit OCR decoder is of course problematic.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 248.437, "r_y0": 167.77099999999996, "r_x1": 286.365, "r_y1": 167.77099999999996, "r_x2": 286.365, "r_y2": 159.21900000000005, "r_x3": 248.437, "r_y3": 159.21900000000005, "coord_origin": "TOPLEFT"}, "text": "OCR is a", "orig": "OCR is a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 179.726, "r_x1": 286.365, "r_y1": 179.726, "r_x2": 286.365, "r_y2": 171.17399999999998, "r_x3": 50.112, "r_y3": 171.17399999999998, "coord_origin": "TOPLEFT"}, "text": "well known and extremely tough problem, that often needs", "orig": "well known and extremely tough problem, that often needs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 191.68200000000002, "r_x1": 286.365, "r_y1": 191.68200000000002, "r_x2": 286.365, "r_y2": 183.13, "r_x3": 50.112, "r_y3": 183.13, "coord_origin": "TOPLEFT"}, "text": "custom training for each individual language. However, the", "orig": "custom training for each individual language. However, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 203.63699999999994, "r_x1": 126.655, "r_y1": 203.63699999999994, "r_x2": 126.655, "r_y2": 195.08500000000004, "r_x3": 50.112, "r_y3": 195.08500000000004, "coord_origin": "TOPLEFT"}, "text": "limited availability", "orig": "limited availability", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 19, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 130.59, "r_y0": 203.63699999999994, "r_x1": 142.206, "r_y1": 203.63699999999994, "r_x2": 142.206, "r_y2": 195.08500000000004, "r_x3": 130.59, "r_y3": 195.08500000000004, "coord_origin": "TOPLEFT"}, "text": "for", "orig": "for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 20, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 146.132, "r_y0": 203.63699999999994, "r_x1": 286.365, "r_y1": 203.63699999999994, "r_x2": 286.365, "r_y2": 195.08500000000004, "r_x3": 146.132, "r_y3": 195.08500000000004, "coord_origin": "TOPLEFT"}, "text": "non-english content in the current", "orig": "non-english content in the current", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 21, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 215.59199999999998, "r_x1": 286.365, "r_y1": 215.59199999999998, "r_x2": 286.365, "r_y2": 207.03999999999996, "r_x3": 50.112, "r_y3": 207.03999999999996, "coord_origin": "TOPLEFT"}, "text": "datasets, makes it impractical to apply the IETD and IEDD", "orig": "datasets, makes it impractical to apply the IETD and IEDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 22, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 227.54700000000003, "r_x1": 286.365, "r_y1": 227.54700000000003, "r_x2": 286.365, "r_y2": 218.995, "r_x3": 50.112, "r_y3": 218.995, "coord_origin": "TOPLEFT"}, "text": "methods on tables with other languages. Additionally, OCR", "orig": "methods on tables with other languages. Additionally, OCR", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 23, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 239.50199999999995, "r_x1": 286.365, "r_y1": 239.50199999999995, "r_x2": 286.365, "r_y2": 230.95000000000005, "r_x3": 50.112, "r_y3": 230.95000000000005, "coord_origin": "TOPLEFT"}, "text": "can be completely omitted if the tables originate from pro-", "orig": "can be completely omitted if the tables originate from pro-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 24, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 251.457, "r_x1": 286.365, "r_y1": 251.457, "r_x2": 286.365, "r_y2": 242.90499999999997, "r_x3": 50.112, "r_y3": 242.90499999999997, "coord_origin": "TOPLEFT"}, "text": "grammatic PDF documents with known positions of each", "orig": "grammatic PDF documents with known positions of each", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 25, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 263.413, "r_x1": 66.989, "r_y1": 263.413, "r_x2": 66.989, "r_y2": 254.861, "r_x3": 50.112, "r_y3": 254.861, "coord_origin": "TOPLEFT"}, "text": "cell.", "orig": "cell.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 26, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 71.382, "r_y0": 263.413, "r_x1": 286.365, "r_y1": 263.413, "r_x2": 286.365, "r_y2": 254.861, "r_x3": 71.382, "r_y3": 254.861, "coord_origin": "TOPLEFT"}, "text": "The latter was the inspiration for the work of this pa-", "orig": "The latter was the inspiration for the work of this pa-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 27, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 275.36800000000005, "r_x1": 64.777, "r_y1": 275.36800000000005, "r_x2": 64.777, "r_y2": 266.81600000000003, "r_x3": 50.112, "r_y3": 266.81600000000003, "coord_origin": "TOPLEFT"}, "text": "per.", "orig": "per.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 28, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 287.395, "r_x1": 90.301, "r_y1": 287.395, "r_x2": 90.301, "r_y2": 278.43899999999996, "r_x3": 62.067, "r_y3": 278.43899999999996, "coord_origin": "TOPLEFT"}, "text": "Graph", "orig": "Graph", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 29, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 96.677, "r_y0": 287.395, "r_x1": 126.007, "r_y1": 287.395, "r_x2": 126.007, "r_y2": 278.43899999999996, "r_x3": 96.677, "r_y3": 278.43899999999996, "coord_origin": "TOPLEFT"}, "text": "Neural", "orig": "Neural", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 30, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 132.373, "r_y0": 287.395, "r_x1": 171.566, "r_y1": 287.395, "r_x2": 171.566, "r_y2": 278.43899999999996, "r_x3": 132.373, "r_y3": 278.43899999999996, "coord_origin": "TOPLEFT"}, "text": "networks", "orig": "networks", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 171.568, "r_y0": 287.379, "r_x1": 174.338, "r_y1": 287.379, "r_x2": 174.338, "r_y2": 278.827, "r_x3": 171.568, "r_y3": 278.827, "coord_origin": "TOPLEFT"}, "text": ":", "orig": ":", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 185.187, "r_y0": 287.379, "r_x1": 210.083, "r_y1": 287.379, "r_x2": 210.083, "r_y2": 278.827, "r_x3": 185.187, "r_y3": 278.827, "coord_origin": "TOPLEFT"}, "text": "Graph", "orig": "Graph", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 216.459, "r_y0": 287.379, "r_x1": 243.568, "r_y1": 287.379, "r_x2": 243.568, "r_y2": 278.827, "r_x3": 216.459, "r_y3": 278.827, "coord_origin": "TOPLEFT"}, "text": "Neural", "orig": "Neural", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 249.944, "r_y0": 287.379, "r_x1": 286.357, "r_y1": 287.379, "r_x2": 286.357, "r_y2": 278.827, "r_x3": 249.944, "r_y3": 278.827, "coord_origin": "TOPLEFT"}, "text": "networks", "orig": "networks", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 299.335, "r_x1": 84.971, "r_y1": 299.335, "r_x2": 84.971, "r_y2": 290.783, "r_x3": 50.112, "r_y3": 290.783, "coord_origin": "TOPLEFT"}, "text": "(GNN's)", "orig": "(GNN's)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 91.347, "r_y0": 299.335, "r_x1": 107.845, "r_y1": 299.335, "r_x2": 107.845, "r_y2": 290.783, "r_x3": 91.347, "r_y3": 290.783, "coord_origin": "TOPLEFT"}, "text": "take", "orig": "take", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 114.211, "r_y0": 299.335, "r_x1": 118.635, "r_y1": 299.335, "r_x2": 118.635, "r_y2": 290.783, "r_x3": 114.211, "r_y3": 290.783, "coord_origin": "TOPLEFT"}, "text": "a", "orig": "a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 125.011, "r_y0": 299.335, "r_x1": 159.87, "r_y1": 299.335, "r_x2": 159.87, "r_y2": 290.783, "r_x3": 125.011, "r_y3": 290.783, "coord_origin": "TOPLEFT"}, "text": "radically", "orig": "radically", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 166.246, "r_y0": 299.335, "r_x1": 200.298, "r_y1": 299.335, "r_x2": 200.298, "r_y2": 290.783, "r_x3": 166.246, "r_y3": 290.783, "coord_origin": "TOPLEFT"}, "text": "different", "orig": "different", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 206.664, "r_y0": 299.335, "r_x1": 243.177, "r_y1": 299.335, "r_x2": 243.177, "r_y2": 290.783, "r_x3": 206.664, "r_y3": 290.783, "coord_origin": "TOPLEFT"}, "text": "approach", "orig": "approach", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 249.553, "r_y0": 299.335, "r_x1": 257.304, "r_y1": 299.335, "r_x2": 257.304, "r_y2": 290.783, "r_x3": 249.553, "r_y3": 290.783, "coord_origin": "TOPLEFT"}, "text": "to", "orig": "to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 263.68, "r_y0": 299.335, "r_x1": 286.365, "r_y1": 299.335, "r_x2": 286.365, "r_y2": 290.783, "r_x3": 263.68, "r_y3": 290.783, "coord_origin": "TOPLEFT"}, "text": "table-", "orig": "table-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 311.29, "r_x1": 84.971, "r_y1": 311.29, "r_x2": 84.971, "r_y2": 302.738, "r_x3": 50.112, "r_y3": 302.738, "coord_origin": "TOPLEFT"}, "text": "structure", "orig": "structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 88.986, "r_y0": 311.29, "r_x1": 131.168, "r_y1": 311.29, "r_x2": 131.168, "r_y2": 302.738, "r_x3": 88.986, "r_y3": 302.738, "coord_origin": "TOPLEFT"}, "text": "extraction.", "orig": "extraction.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 138.849, "r_y0": 311.29, "r_x1": 286.365, "r_y1": 311.29, "r_x2": 286.365, "r_y2": 302.738, "r_x3": 138.849, "r_y3": 302.738, "coord_origin": "TOPLEFT"}, "text": "Note that one table cell can consti-", "orig": "Note that one table cell can consti-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 323.245, "r_x1": 286.365, "r_y1": 323.245, "r_x2": 286.365, "r_y2": 314.693, "r_x3": 50.112, "r_y3": 314.693, "coord_origin": "TOPLEFT"}, "text": "tute out of multiple text-cells. To obtain the table-structure,", "orig": "tute out of multiple text-cells. To obtain the table-structure,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 335.2, "r_x1": 136.996, "r_y1": 335.2, "r_x2": 136.996, "r_y2": 326.648, "r_x3": 50.112, "r_y3": 326.648, "coord_origin": "TOPLEFT"}, "text": "one creates an initial", "orig": "one creates an initial", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 48, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 141.051, "r_y0": 335.2, "r_x1": 166.226, "r_y1": 335.2, "r_x2": 166.226, "r_y2": 326.648, "r_x3": 141.051, "r_y3": 326.648, "coord_origin": "TOPLEFT"}, "text": "graph,", "orig": "graph,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 49, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 170.679, "r_y0": 335.2, "r_x1": 286.365, "r_y1": 335.2, "r_x2": 286.365, "r_y2": 326.648, "r_x3": 170.679, "r_y3": 326.648, "coord_origin": "TOPLEFT"}, "text": "where each of the text-cells", "orig": "where each of the text-cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 50, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 347.155, "r_x1": 260.442, "r_y1": 347.155, "r_x2": 260.442, "r_y2": 338.603, "r_x3": 50.112, "r_y3": 338.603, "coord_origin": "TOPLEFT"}, "text": "becomes a node in the graph similar to [33, 34, 2].", "orig": "becomes a node in the graph similar to [33, 34, 2].", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 51, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 266.45, "r_y0": 347.155, "r_x1": 286.365, "r_y1": 347.155, "r_x2": 286.365, "r_y2": 338.603, "r_x3": 266.45, "r_y3": 338.603, "coord_origin": "TOPLEFT"}, "text": "Each", "orig": "Each", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 52, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 359.11, "r_x1": 286.365, "r_y1": 359.11, "r_x2": 286.365, "r_y2": 350.558, "r_x3": 50.112, "r_y3": 350.558, "coord_origin": "TOPLEFT"}, "text": "node is then associated with en embedding vector coming", "orig": "node is then associated with en embedding vector coming", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 53, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 371.066, "r_x1": 286.365, "r_y1": 371.066, "r_x2": 286.365, "r_y2": 362.514, "r_x3": 50.112, "r_y3": 362.514, "coord_origin": "TOPLEFT"}, "text": "from the encoded image, its coordinates and the encoded", "orig": "from the encoded image, its coordinates and the encoded", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 54, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 383.021, "r_x1": 67.397, "r_y1": 383.021, "r_x2": 67.397, "r_y2": 374.469, "r_x3": 50.112, "r_y3": 374.469, "coord_origin": "TOPLEFT"}, "text": "text.", "orig": "text.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 55, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 72.976, "r_y0": 383.021, "r_x1": 286.365, "r_y1": 383.021, "r_x2": 286.365, "r_y2": 374.469, "r_x3": 72.976, "r_y3": 374.469, "coord_origin": "TOPLEFT"}, "text": "Furthermore, nodes that represent adjacent text-cells", "orig": "Furthermore, nodes that represent adjacent text-cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 56, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 394.976, "r_x1": 92.602, "r_y1": 394.976, "r_x2": 92.602, "r_y2": 386.424, "r_x3": 50.112, "r_y3": 386.424, "coord_origin": "TOPLEFT"}, "text": "are linked.", "orig": "are linked.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 57, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 97.305, "r_y0": 394.976, "r_x1": 286.365, "r_y1": 394.976, "r_x2": 286.365, "r_y2": 386.424, "r_x3": 97.305, "r_y3": 386.424, "coord_origin": "TOPLEFT"}, "text": "Graph Convolutional Networks (GCN's) based", "orig": "Graph Convolutional Networks (GCN's) based", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 58, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 406.931, "r_x1": 286.365, "r_y1": 406.931, "r_x2": 286.365, "r_y2": 398.379, "r_x3": 50.112, "r_y3": 398.379, "coord_origin": "TOPLEFT"}, "text": "methods take the image as an input, but also the position of", "orig": "methods take the image as an input, but also the position of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 59, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 418.886, "r_x1": 286.365, "r_y1": 418.886, "r_x2": 286.365, "r_y2": 410.334, "r_x3": 50.112, "r_y3": 410.334, "coord_origin": "TOPLEFT"}, "text": "the text-cells and their content [18]. The purpose of a GCN", "orig": "the text-cells and their content [18]. The purpose of a GCN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 60, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 430.841, "r_x1": 286.365, "r_y1": 430.841, "r_x2": 286.365, "r_y2": 422.289, "r_x3": 50.112, "r_y3": 422.289, "coord_origin": "TOPLEFT"}, "text": "is to transform the input graph into a new graph, which re-", "orig": "is to transform the input graph into a new graph, which re-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 61, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 442.797, "r_x1": 198.236, "r_y1": 442.797, "r_x2": 198.236, "r_y2": 434.245, "r_x3": 50.112, "r_y3": 434.245, "coord_origin": "TOPLEFT"}, "text": "places the old links with new ones.", "orig": "places the old links with new ones.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 62, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 205.927, "r_y0": 442.797, "r_x1": 286.365, "r_y1": 442.797, "r_x2": 286.365, "r_y2": 434.245, "r_x3": 205.927, "r_y3": 434.245, "coord_origin": "TOPLEFT"}, "text": "The new links then", "orig": "The new links then", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 63, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 454.752, "r_x1": 165.618, "r_y1": 454.752, "r_x2": 165.618, "r_y2": 446.2, "r_x3": 50.112, "r_y3": 446.2, "coord_origin": "TOPLEFT"}, "text": "represent the table-structure.", "orig": "represent the table-structure.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 64, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 171.417, "r_y0": 454.752, "r_x1": 286.365, "r_y1": 454.752, "r_x2": 286.365, "r_y2": 446.2, "r_x3": 171.417, "r_y3": 446.2, "coord_origin": "TOPLEFT"}, "text": "With this approach, one can", "orig": "With this approach, one can", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 65, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 466.707, "r_x1": 242.36, "r_y1": 466.707, "r_x2": 242.36, "r_y2": 458.155, "r_x3": 50.112, "r_y3": 458.155, "coord_origin": "TOPLEFT"}, "text": "avoid the need to build custom OCR decoders.", "orig": "avoid the need to build custom OCR decoders.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 66, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 248.408, "r_y0": 466.707, "r_x1": 286.365, "r_y1": 466.707, "r_x2": 286.365, "r_y2": 458.155, "r_x3": 248.408, "r_y3": 458.155, "coord_origin": "TOPLEFT"}, "text": "However,", "orig": "However,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 67, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 478.662, "r_x1": 286.365, "r_y1": 478.662, "r_x2": 286.365, "r_y2": 470.11, "r_x3": 50.112, "r_y3": 470.11, "coord_origin": "TOPLEFT"}, "text": "the quality of the reconstructed structure is not comparable", "orig": "the quality of the reconstructed structure is not comparable", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 68, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 490.617, "r_x1": 186.5, "r_y1": 490.617, "r_x2": 186.5, "r_y2": 482.065, "r_x3": 50.112, "r_y3": 482.065, "coord_origin": "TOPLEFT"}, "text": "to the current state-of-the-art [18].", "orig": "to the current state-of-the-art [18].", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 69, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 502.645, "r_x1": 252.881, "r_y1": 502.645, "r_x2": 252.881, "r_y2": 493.689, "r_x3": 62.067, "r_y3": 493.689, "coord_origin": "TOPLEFT"}, "text": "Hybrid Deep Learning-Rule-Based approach", "orig": "Hybrid Deep Learning-Rule-Based approach", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 70, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 252.882, "r_y0": 502.629, "r_x1": 255.652, "r_y1": 502.629, "r_x2": 255.652, "r_y2": 494.077, "r_x3": 252.882, "r_y3": 494.077, "coord_origin": "TOPLEFT"}, "text": ":", "orig": ":", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 71, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 258.63, "r_y0": 502.629, "r_x1": 286.366, "r_y1": 502.629, "r_x2": 286.366, "r_y2": 494.077, "r_x3": 258.63, "r_y3": 494.077, "coord_origin": "TOPLEFT"}, "text": "Apop-", "orig": "Apop-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 72, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 514.5840000000001, "r_x1": 286.365, "r_y1": 514.5840000000001, "r_x2": 286.365, "r_y2": 506.032, "r_x3": 50.112, "r_y3": 506.032, "coord_origin": "TOPLEFT"}, "text": "ular current model for table-structure identification is the", "orig": "ular current model for table-structure identification is the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 73, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 526.539, "r_x1": 286.365, "r_y1": 526.539, "r_x2": 286.365, "r_y2": 517.9870000000001, "r_x3": 50.112, "r_y3": 517.9870000000001, "coord_origin": "TOPLEFT"}, "text": "use of a hybrid Deep Learning-Rule-Based approach similar", "orig": "use of a hybrid Deep Learning-Rule-Based approach similar", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 74, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 538.494, "r_x1": 286.365, "r_y1": 538.494, "r_x2": 286.365, "r_y2": 529.942, "r_x3": 50.112, "r_y3": 529.942, "coord_origin": "TOPLEFT"}, "text": "to [27, 29]. In this approach, one first detects the position of", "orig": "to [27, 29]. In this approach, one first detects the position of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 75, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 550.45, "r_x1": 286.365, "r_y1": 550.45, "r_x2": 286.365, "r_y2": 541.898, "r_x3": 50.112, "r_y3": 541.898, "coord_origin": "TOPLEFT"}, "text": "the table-cells with object detection (e.g. YoloVx or Mask-", "orig": "the table-cells with object detection (e.g. YoloVx or Mask-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 76, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 562.405, "r_x1": 286.365, "r_y1": 562.405, "r_x2": 286.365, "r_y2": 553.8530000000001, "r_x3": 50.112, "r_y3": 553.8530000000001, "coord_origin": "TOPLEFT"}, "text": "RCNN), then classifies the table into different types (from", "orig": "RCNN), then classifies the table into different types (from", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 77, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 574.36, "r_x1": 59.527, "r_y1": 574.36, "r_x2": 59.527, "r_y2": 565.808, "r_x3": 50.112, "r_y3": 565.808, "coord_origin": "TOPLEFT"}, "text": "its", "orig": "its", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 78, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 64.259, "r_y0": 574.36, "r_x1": 95.8, "r_y1": 574.36, "r_x2": 95.8, "r_y2": 565.808, "r_x3": 64.259, "r_y3": 565.808, "coord_origin": "TOPLEFT"}, "text": "images)", "orig": "images)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 79, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 100.523, "r_y0": 574.36, "r_x1": 145.105, "r_y1": 574.36, "r_x2": 145.105, "r_y2": 565.808, "r_x3": 100.523, "r_y3": 565.808, "coord_origin": "TOPLEFT"}, "text": "and finally", "orig": "and finally", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 80, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 149.828, "r_y0": 574.36, "r_x1": 166.983, "r_y1": 574.36, "r_x2": 166.983, "r_y2": 565.808, "r_x3": 149.828, "r_y3": 565.808, "coord_origin": "TOPLEFT"}, "text": "uses", "orig": "uses", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 81, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 171.715, "r_y0": 574.36, "r_x1": 205.768, "r_y1": 574.36, "r_x2": 205.768, "r_y2": 565.808, "r_x3": 171.715, "r_y3": 565.808, "coord_origin": "TOPLEFT"}, "text": "different", "orig": "different", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 82, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 210.5, "r_y0": 574.36, "r_x1": 244.243, "r_y1": 574.36, "r_x2": 244.243, "r_y2": 565.808, "r_x3": 210.5, "r_y3": 565.808, "coord_origin": "TOPLEFT"}, "text": "rule-sets", "orig": "rule-sets", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 83, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 248.975, "r_y0": 574.36, "r_x1": 256.726, "r_y1": 574.36, "r_x2": 256.726, "r_y2": 565.808, "r_x3": 248.975, "r_y3": 565.808, "coord_origin": "TOPLEFT"}, "text": "to", "orig": "to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 84, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 261.459, "r_y0": 574.36, "r_x1": 286.365, "r_y1": 574.36, "r_x2": 286.365, "r_y2": 565.808, "r_x3": 261.459, "r_y3": 565.808, "coord_origin": "TOPLEFT"}, "text": "obtain", "orig": "obtain", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 85, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 586.315, "r_x1": 122.64, "r_y1": 586.315, "r_x2": 122.64, "r_y2": 577.763, "r_x3": 50.112, "r_y3": 577.763, "coord_origin": "TOPLEFT"}, "text": "its table-structure.", "orig": "its table-structure.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 86, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 127.482, "r_y0": 586.315, "r_x1": 286.365, "r_y1": 586.315, "r_x2": 286.365, "r_y2": 577.763, "r_x3": 127.482, "r_y3": 577.763, "coord_origin": "TOPLEFT"}, "text": "Currently, this approach achieves state-", "orig": "Currently, this approach achieves state-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 87, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 598.27, "r_x1": 87.731, "r_y1": 598.27, "r_x2": 87.731, "r_y2": 589.718, "r_x3": 50.112, "r_y3": 589.718, "coord_origin": "TOPLEFT"}, "text": "of-the-art", "orig": "of-the-art", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 88, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 92.074, "r_y0": 598.27, "r_x1": 120.577, "r_y1": 598.27, "r_x2": 120.577, "r_y2": 589.718, "r_x3": 92.074, "r_y3": 589.718, "coord_origin": "TOPLEFT"}, "text": "results,", "orig": "results,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 89, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 125.389, "r_y0": 598.27, "r_x1": 137.922, "r_y1": 598.27, "r_x2": 137.922, "r_y2": 589.718, "r_x3": 125.389, "r_y3": 589.718, "coord_origin": "TOPLEFT"}, "text": "but", "orig": "but", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 90, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 142.266, "r_y0": 598.27, "r_x1": 148.911, "r_y1": 598.27, "r_x2": 148.911, "r_y2": 589.718, "r_x3": 142.266, "r_y3": 589.718, "coord_origin": "TOPLEFT"}, "text": "is", "orig": "is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 91, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 153.255, "r_y0": 598.27, "r_x1": 165.987, "r_y1": 598.27, "r_x2": 165.987, "r_y2": 589.718, "r_x3": 153.255, "r_y3": 589.718, "coord_origin": "TOPLEFT"}, "text": "not", "orig": "not", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 92, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 170.331, "r_y0": 598.27, "r_x1": 286.365, "r_y1": 598.27, "r_x2": 286.365, "r_y2": 589.718, "r_x3": 170.331, "r_y3": 589.718, "coord_origin": "TOPLEFT"}, "text": "an end-to-end deep-learning", "orig": "an end-to-end deep-learning", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 93, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 610.225, "r_x1": 82.49, "r_y1": 610.225, "r_x2": 82.49, "r_y2": 601.673, "r_x3": 50.112, "r_y3": 601.673, "coord_origin": "TOPLEFT"}, "text": "method.", "orig": "method.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 94, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 87.173, "r_y0": 610.225, "r_x1": 286.365, "r_y1": 610.225, "r_x2": 286.365, "r_y2": 601.673, "r_x3": 87.173, "r_y3": 601.673, "coord_origin": "TOPLEFT"}, "text": "As such, new rules need to be written if different", "orig": "As such, new rules need to be written if different", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 95, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 622.181, "r_x1": 175.989, "r_y1": 622.181, "r_x2": 175.989, "r_y2": 613.629, "r_x3": 50.112, "r_y3": 613.629, "coord_origin": "TOPLEFT"}, "text": "types of tables are encountered.", "orig": "types of tables are encountered.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 96, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 646.693, "r_x1": 105.225, "r_y1": 646.693, "r_x2": 105.225, "r_y2": 635.9449999999999, "r_x3": 50.112, "r_y3": 635.9449999999999, "coord_origin": "TOPLEFT"}, "text": "3. Datasets", "orig": "3. Datasets", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 97, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 665.246, "r_x1": 286.365, "r_y1": 665.246, "r_x2": 286.365, "r_y2": 656.694, "r_x3": 62.067, "r_y3": 656.694, "coord_origin": "TOPLEFT"}, "text": "We rely on large-scale datasets such as PubTabNet [37],", "orig": "We rely on large-scale datasets such as PubTabNet [37],", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 98, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 677.201, "r_x1": 286.365, "r_y1": 677.201, "r_x2": 286.365, "r_y2": 668.649, "r_x3": 50.112, "r_y3": 668.649, "coord_origin": "TOPLEFT"}, "text": "FinTabNet [36], and TableBank [17] datasets to train and", "orig": "FinTabNet [36], and TableBank [17] datasets to train and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 99, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 689.156, "r_x1": 133.479, "r_y1": 689.156, "r_x2": 133.479, "r_y2": 680.604, "r_x3": 50.112, "r_y3": 680.604, "coord_origin": "TOPLEFT"}, "text": "evaluate our models.", "orig": "evaluate our models.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 100, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 138.271, "r_y0": 689.156, "r_x1": 286.365, "r_y1": 689.156, "r_x2": 286.365, "r_y2": 680.604, "r_x3": 138.271, "r_y3": 680.604, "coord_origin": "TOPLEFT"}, "text": "These datasets span over various ap-", "orig": "These datasets span over various ap-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 101, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 701.111, "r_x1": 166.246, "r_y1": 701.111, "r_x2": 166.246, "r_y2": 692.559, "r_x3": 50.112, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "pearance styles and content.", "orig": "pearance styles and content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 102, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 173.688, "r_y0": 701.111, "r_x1": 286.365, "r_y1": 701.111, "r_x2": 286.365, "r_y2": 692.559, "r_x3": 173.688, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "We also introduce our own", "orig": "We also introduce our own", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 103, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 713.066, "r_x1": 286.365, "r_y1": 713.066, "r_x2": 286.365, "r_y2": 704.514, "r_x3": 50.112, "r_y3": 704.514, "coord_origin": "TOPLEFT"}, "text": "synthetically generated SynthTabNet dataset to fix an im-", "orig": "synthetically generated SynthTabNet dataset to fix an im-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 104, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 380.799, "r_y0": 88.46699999999998, "r_x1": 486.849, "r_y1": 88.46699999999998, "r_x2": 486.849, "r_y2": 80.154, "r_x3": 380.799, "r_y3": 80.154, "coord_origin": "TOPLEFT"}, "text": "PubTabNet + FinTabNet", "orig": "PubTabNet + FinTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 105, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 396.768, "r_y0": 250.68200000000002, "r_x1": 469.787, "r_y1": 250.68200000000002, "r_x2": 469.787, "r_y2": 242.36900000000003, "r_x3": 396.768, "r_y3": 242.36900000000003, "coord_origin": "TOPLEFT"}, "text": "Rows / Columns", "orig": "Rows / Columns", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 106, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.977, "r_y0": 239.19299999999998, "r_x1": 324.793, "r_y1": 239.19299999999998, "r_x2": 324.793, "r_y2": 233.65099999999995, "r_x3": 320.977, "r_y3": 233.65099999999995, "coord_origin": "TOPLEFT"}, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 107, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 410.483, "r_y0": 239.19299999999998, "r_x1": 418.113, "r_y1": 239.19299999999998, "r_x2": 418.113, "r_y2": 233.65099999999995, "r_x3": 410.483, "r_y3": 233.65099999999995, "coord_origin": "TOPLEFT"}, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 108, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 500.85, "r_y0": 239.19299999999998, "r_x1": 508.48, "r_y1": 239.19299999999998, "r_x2": 508.48, "r_y2": 233.65099999999995, "r_x3": 500.85, "r_y3": 233.65099999999995, "coord_origin": "TOPLEFT"}, "text": "40", "orig": "40", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 109, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 365.3, "r_y0": 239.19299999999998, "r_x1": 372.93, "r_y1": 239.19299999999998, "r_x2": 372.93, "r_y2": 233.65099999999995, "r_x3": 365.3, "r_y3": 233.65099999999995, "coord_origin": "TOPLEFT"}, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 110, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 455.666, "r_y0": 239.19299999999998, "r_x1": 463.296, "r_y1": 239.19299999999998, "r_x2": 463.296, "r_y2": 233.65099999999995, "r_x3": 455.666, "r_y3": 233.65099999999995, "coord_origin": "TOPLEFT"}, "text": "30", "orig": "30", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 111, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 542.035, "r_y0": 239.19299999999998, "r_x1": 549.665, "r_y1": 239.19299999999998, "r_x2": 549.665, "r_y2": 233.65099999999995, "r_x3": 542.035, "r_y3": 233.65099999999995, "coord_origin": "TOPLEFT"}, "text": "50", "orig": "50", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 112, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 316.045, "r_y0": 236.21699999999998, "r_x1": 319.861, "r_y1": 236.21699999999998, "r_x2": 319.861, "r_y2": 230.67399999999998, "r_x3": 316.045, "r_y3": 230.67399999999998, "coord_origin": "TOPLEFT"}, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 113, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 312.625, "r_y0": 204.461, "r_x1": 320.255, "r_y1": 204.461, "r_x2": 320.255, "r_y2": 198.91899999999998, "r_x3": 312.625, "r_y3": 198.91899999999998, "coord_origin": "TOPLEFT"}, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 114, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 313.15, "r_y0": 173.86800000000005, "r_x1": 320.78, "r_y1": 173.86800000000005, "r_x2": 320.78, "r_y2": 168.32600000000002, "r_x3": 313.15, "r_y3": 168.32600000000002, "coord_origin": "TOPLEFT"}, "text": "40", "orig": "40", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 115, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 312.93, "r_y0": 142.35799999999995, "r_x1": 320.56, "r_y1": 142.35799999999995, "r_x2": 320.56, "r_y2": 136.81600000000003, "r_x3": 312.93, "r_y3": 136.81600000000003, "coord_origin": "TOPLEFT"}, "text": "60", "orig": "60", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 116, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 312.482, "r_y0": 111.37199999999996, "r_x1": 320.112, "r_y1": 111.37199999999996, "r_x2": 320.112, "r_y2": 105.83000000000004, "r_x3": 312.482, "r_y3": 105.83000000000004, "coord_origin": "TOPLEFT"}, "text": "80", "orig": "80", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 117, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 312.482, "r_y0": 218.02999999999997, "r_x1": 320.112, "r_y1": 218.02999999999997, "r_x2": 320.112, "r_y2": 212.48699999999997, "r_x3": 312.482, "r_y3": 212.48699999999997, "coord_origin": "TOPLEFT"}, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 118, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 313.076, "r_y0": 189.49199999999996, "r_x1": 320.707, "r_y1": 189.49199999999996, "r_x2": 320.707, "r_y2": 183.95000000000005, "r_x3": 313.076, "r_y3": 183.95000000000005, "coord_origin": "TOPLEFT"}, "text": "30", "orig": "30", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 119, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 312.763, "r_y0": 158.24400000000003, "r_x1": 320.393, "r_y1": 158.24400000000003, "r_x2": 320.393, "r_y2": 152.702, "r_x3": 312.763, "r_y3": 152.702, "coord_origin": "TOPLEFT"}, "text": "50", "orig": "50", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 120, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 312.198, "r_y0": 126.34100000000001, "r_x1": 319.828, "r_y1": 126.34100000000001, "r_x2": 319.828, "r_y2": 120.798, "r_x3": 312.198, "r_y3": 120.798, "coord_origin": "TOPLEFT"}, "text": "70", "orig": "70", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 121, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 312.817, "r_y0": 95.87900000000002, "r_x1": 320.447, "r_y1": 95.87900000000002, "r_x2": 320.447, "r_y2": 90.33699999999999, "r_x3": 312.817, "r_y3": 90.33699999999999, "coord_origin": "TOPLEFT"}, "text": "90", "orig": "90", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 122, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 532.174, "r_y0": 229.94000000000005, "r_x1": 536.944, "r_y1": 229.94000000000005, "r_x2": 536.944, "r_y2": 223.01199999999994, "r_x3": 532.174, "r_y3": 223.01199999999994, "coord_origin": "TOPLEFT"}, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 123, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 532.88, "r_y0": 115.48000000000002, "r_x1": 547.613, "r_y1": 115.48000000000002, "r_x2": 547.613, "r_y2": 108.55200000000002, "r_x3": 532.88, "r_y3": 108.55200000000002, "coord_origin": "TOPLEFT"}, "text": "10K", "orig": "10K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 124, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 532.774, "r_y0": 137.99400000000003, "r_x1": 542.739, "r_y1": 137.99400000000003, "r_x2": 542.739, "r_y2": 131.06600000000003, "r_x3": 532.774, "r_y3": 131.06600000000003, "coord_origin": "TOPLEFT"}, "text": "8K", "orig": "8K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 125, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 532.799, "r_y0": 161.13599999999997, "r_x1": 542.764, "r_y1": 161.13599999999997, "r_x2": 542.764, "r_y2": 154.20799999999997, "r_x3": 532.799, "r_y3": 154.20799999999997, "coord_origin": "TOPLEFT"}, "text": "6K", "orig": "6K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 126, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 532.571, "r_y0": 183.971, "r_x1": 542.536, "r_y1": 183.971, "r_x2": 542.536, "r_y2": 177.043, "r_x3": 532.571, "r_y3": 177.043, "coord_origin": "TOPLEFT"}, "text": "4K", "orig": "4K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 127, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 532.146, "r_y0": 206.85900000000004, "r_x1": 542.111, "r_y1": 206.85900000000004, "r_x2": 542.111, "r_y2": 199.93100000000004, "r_x3": 532.146, "r_y3": 199.93100000000004, "coord_origin": "TOPLEFT"}, "text": "2K", "orig": "2K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 128, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 276.65700000000004, "r_x1": 346.062, "r_y1": 276.65700000000004, "r_x2": 346.062, "r_y2": 268.105, "r_x3": 308.862, "r_y3": 268.105, "coord_origin": "TOPLEFT"}, "text": "Figure 2:", "orig": "Figure 2:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 129, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 354.491, "r_y0": 276.65700000000004, "r_x1": 545.115, "r_y1": 276.65700000000004, "r_x2": 545.115, "r_y2": 268.105, "r_x3": 354.491, "r_y3": 268.105, "coord_origin": "TOPLEFT"}, "text": "Distribution of the tables across different table", "orig": "Distribution of the tables across different table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 130, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 288.612, "r_x1": 498.57, "r_y1": 288.612, "r_x2": 498.57, "r_y2": 280.06, "r_x3": 308.862, "r_y3": 280.06, "coord_origin": "TOPLEFT"}, "text": "dimensions in PubTabNet + FinTabNet datasets", "orig": "dimensions in PubTabNet + FinTabNet datasets", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 131, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 326.294, "r_x1": 437.27, "r_y1": 326.294, "r_x2": 437.27, "r_y2": 317.742, "r_x3": 308.862, "r_y3": 317.742, "coord_origin": "TOPLEFT"}, "text": "balance in the previous datasets.", "orig": "balance in the previous datasets.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 132, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 340.352, "r_x1": 545.115, "r_y1": 340.352, "r_x2": 545.115, "r_y2": 331.8, "r_x3": 320.817, "r_y3": 331.8, "coord_origin": "TOPLEFT"}, "text": "The PubTabNet dataset contains 509k tables delivered as", "orig": "The PubTabNet dataset contains 509k tables delivered as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 133, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 352.307, "r_x1": 545.115, "r_y1": 352.307, "r_x2": 545.115, "r_y2": 343.755, "r_x3": 308.862, "r_y3": 343.755, "coord_origin": "TOPLEFT"}, "text": "annotated PNGimages. The annotations consist of the table", "orig": "annotated PNGimages. The annotations consist of the table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 134, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 364.263, "r_x1": 545.115, "r_y1": 364.263, "r_x2": 545.115, "r_y2": 355.711, "r_x3": 308.862, "r_y3": 355.711, "coord_origin": "TOPLEFT"}, "text": "structure represented in HTML format, the tokenized text", "orig": "structure represented in HTML format, the tokenized text", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 135, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 376.218, "r_x1": 545.115, "r_y1": 376.218, "r_x2": 545.115, "r_y2": 367.666, "r_x3": 308.862, "r_y3": 367.666, "coord_origin": "TOPLEFT"}, "text": "and its bounding boxes per table cell. Fig. 1 shows the ap-", "orig": "and its bounding boxes per table cell. Fig. 1 shows the ap-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 136, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 388.173, "r_x1": 545.115, "r_y1": 388.173, "r_x2": 545.115, "r_y2": 379.621, "r_x3": 308.862, "r_y3": 379.621, "coord_origin": "TOPLEFT"}, "text": "pearance style of PubTabNet. Depending on its complexity,", "orig": "pearance style of PubTabNet. Depending on its complexity,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 137, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 400.128, "r_x1": 545.115, "r_y1": 400.128, "r_x2": 545.115, "r_y2": 391.576, "r_x3": 308.862, "r_y3": 391.576, "coord_origin": "TOPLEFT"}, "text": "a table is characterized as 'simple' when it does not contain", "orig": "a table is characterized as 'simple' when it does not contain", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 138, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 412.083, "r_x1": 545.115, "r_y1": 412.083, "r_x2": 545.115, "r_y2": 403.531, "r_x3": 308.862, "r_y3": 403.531, "coord_origin": "TOPLEFT"}, "text": "row spans or column spans, otherwise it is 'complex'. The", "orig": "row spans or column spans, otherwise it is 'complex'. The", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 139, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 424.038, "r_x1": 545.115, "r_y1": 424.038, "r_x2": 545.115, "r_y2": 415.486, "r_x3": 308.862, "r_y3": 415.486, "coord_origin": "TOPLEFT"}, "text": "dataset is divided into Train and Val splits (roughly 98%and", "orig": "dataset is divided into Train and Val splits (roughly 98%and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 140, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 435.994, "r_x1": 545.115, "r_y1": 435.994, "r_x2": 545.115, "r_y2": 427.442, "r_x3": 308.862, "r_y3": 427.442, "coord_origin": "TOPLEFT"}, "text": "2%). The Train split consists of 54% simple and 46% com-", "orig": "2%). The Train split consists of 54% simple and 46% com-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 141, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 447.949, "r_x1": 545.115, "r_y1": 447.949, "r_x2": 545.115, "r_y2": 439.397, "r_x3": 308.862, "r_y3": 439.397, "coord_origin": "TOPLEFT"}, "text": "plex tables and the Val split of 51% and 49% respectively.", "orig": "plex tables and the Val split of 51% and 49% respectively.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 142, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 459.904, "r_x1": 545.115, "r_y1": 459.904, "r_x2": 545.115, "r_y2": 451.352, "r_x3": 308.862, "r_y3": 451.352, "coord_origin": "TOPLEFT"}, "text": "The FinTabNet dataset contains 112k tables delivered as", "orig": "The FinTabNet dataset contains 112k tables delivered as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 143, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 471.859, "r_x1": 545.115, "r_y1": 471.859, "r_x2": 545.115, "r_y2": 463.307, "r_x3": 308.862, "r_y3": 463.307, "coord_origin": "TOPLEFT"}, "text": "single-page PDFdocuments with mixed table structures and", "orig": "single-page PDFdocuments with mixed table structures and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 144, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 483.814, "r_x1": 358.984, "r_y1": 483.814, "r_x2": 358.984, "r_y2": 475.262, "r_x3": 308.862, "r_y3": 475.262, "coord_origin": "TOPLEFT"}, "text": "text content.", "orig": "text content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 145, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 365.121, "r_y0": 483.814, "r_x1": 545.115, "r_y1": 483.814, "r_x2": 545.115, "r_y2": 475.262, "r_x3": 365.121, "r_y3": 475.262, "coord_origin": "TOPLEFT"}, "text": "Similarly to the PubTabNet, the annotations", "orig": "Similarly to the PubTabNet, the annotations", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 146, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 495.77, "r_x1": 545.115, "r_y1": 495.77, "r_x2": 545.115, "r_y2": 487.218, "r_x3": 308.862, "r_y3": 487.218, "coord_origin": "TOPLEFT"}, "text": "of FinTabNet include the table structure in HTML, the to-", "orig": "of FinTabNet include the table structure in HTML, the to-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 147, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 507.725, "r_x1": 545.115, "r_y1": 507.725, "r_x2": 545.115, "r_y2": 499.173, "r_x3": 308.862, "r_y3": 499.173, "coord_origin": "TOPLEFT"}, "text": "kenized text and the bounding boxes on a table cell basis.", "orig": "kenized text and the bounding boxes on a table cell basis.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 148, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 519.6800000000001, "r_x1": 545.115, "r_y1": 519.6800000000001, "r_x2": 545.115, "r_y2": 511.128, "r_x3": 308.862, "r_y3": 511.128, "coord_origin": "TOPLEFT"}, "text": "The dataset is divided into Train, Test and Val splits (81%,", "orig": "The dataset is divided into Train, Test and Val splits (81%,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 149, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 531.635, "r_x1": 545.115, "r_y1": 531.635, "r_x2": 545.115, "r_y2": 523.0830000000001, "r_x3": 308.862, "r_y3": 523.0830000000001, "coord_origin": "TOPLEFT"}, "text": "9.5%, 9.5%), and each one is almost equally divided into", "orig": "9.5%, 9.5%), and each one is almost equally divided into", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 150, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 543.59, "r_x1": 545.115, "r_y1": 543.59, "r_x2": 545.115, "r_y2": 535.038, "r_x3": 308.862, "r_y3": 535.038, "coord_origin": "TOPLEFT"}, "text": "simple and complex tables (Train: 48% simple, 52% com-", "orig": "simple and complex tables (Train: 48% simple, 52% com-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 151, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 555.545, "r_x1": 350.964, "r_y1": 555.545, "r_x2": 350.964, "r_y2": 546.9929999999999, "r_x3": 308.862, "r_y3": 546.9929999999999, "coord_origin": "TOPLEFT"}, "text": "plex, Test:", "orig": "plex, Test:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 152, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 355.467, "r_y0": 555.545, "r_x1": 490.082, "r_y1": 555.545, "r_x2": 490.082, "r_y2": 546.9929999999999, "r_x3": 355.467, "r_y3": 546.9929999999999, "coord_origin": "TOPLEFT"}, "text": "48% simple, 52% complex, Test:", "orig": "48% simple, 52% complex, Test:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 153, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 494.595, "r_y0": 555.545, "r_x1": 545.115, "r_y1": 555.545, "r_x2": 545.115, "r_y2": 546.9929999999999, "r_x3": 494.595, "r_y3": 546.9929999999999, "coord_origin": "TOPLEFT"}, "text": "53% simple,", "orig": "53% simple,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 154, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 567.501, "r_x1": 370.6, "r_y1": 567.501, "r_x2": 370.6, "r_y2": 558.9490000000001, "r_x3": 308.862, "r_y3": 558.9490000000001, "coord_origin": "TOPLEFT"}, "text": "47% complex).", "orig": "47% complex).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 155, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 376.737, "r_y0": 567.501, "r_x1": 545.115, "r_y1": 567.501, "r_x2": 545.115, "r_y2": 558.9490000000001, "r_x3": 376.737, "r_y3": 558.9490000000001, "coord_origin": "TOPLEFT"}, "text": "Finally the TableBank dataset consists of", "orig": "Finally the TableBank dataset consists of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 156, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 579.456, "r_x1": 545.115, "r_y1": 579.456, "r_x2": 545.115, "r_y2": 570.904, "r_x3": 308.862, "r_y3": 570.904, "coord_origin": "TOPLEFT"}, "text": "145k tables provided as JPEG images. The latter has anno-", "orig": "145k tables provided as JPEG images. The latter has anno-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 157, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 591.4110000000001, "r_x1": 545.115, "r_y1": 591.4110000000001, "r_x2": 545.115, "r_y2": 582.859, "r_x3": 308.862, "r_y3": 582.859, "coord_origin": "TOPLEFT"}, "text": "tations for the table structure, but only few with bounding", "orig": "tations for the table structure, but only few with bounding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 158, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 603.366, "r_x1": 403.726, "r_y1": 603.366, "r_x2": 403.726, "r_y2": 594.814, "r_x3": 308.862, "r_y3": 594.814, "coord_origin": "TOPLEFT"}, "text": "boxes of the table cells.", "orig": "boxes of the table cells.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 159, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 407.731, "r_y0": 603.366, "r_x1": 545.115, "r_y1": 603.366, "r_x2": 545.115, "r_y2": 594.814, "r_x3": 407.731, "r_y3": 594.814, "coord_origin": "TOPLEFT"}, "text": "The entire dataset consists of sim-", "orig": "The entire dataset consists of sim-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 160, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 615.321, "r_x1": 545.115, "r_y1": 615.321, "r_x2": 545.115, "r_y2": 606.769, "r_x3": 308.862, "r_y3": 606.769, "coord_origin": "TOPLEFT"}, "text": "ple tables and it is divided into 90% Train, 3% Test and 7%", "orig": "ple tables and it is divided into 90% Train, 3% Test and 7%", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 161, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 627.2760000000001, "r_x1": 348.164, "r_y1": 627.2760000000001, "r_x2": 348.164, "r_y2": 618.7239999999999, "r_x3": 308.862, "r_y3": 618.7239999999999, "coord_origin": "TOPLEFT"}, "text": "Val splits.", "orig": "Val splits.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 162, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 641.335, "r_x1": 545.115, "r_y1": 641.335, "r_x2": 545.115, "r_y2": 632.783, "r_x3": 320.817, "r_y3": 632.783, "coord_origin": "TOPLEFT"}, "text": "Due to the heterogeneity across the dataset formats, it", "orig": "Due to the heterogeneity across the dataset formats, it", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 163, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 653.29, "r_x1": 545.115, "r_y1": 653.29, "r_x2": 545.115, "r_y2": 644.738, "r_x3": 308.862, "r_y3": 644.738, "coord_origin": "TOPLEFT"}, "text": "was necessary to combine all available data into one homog-", "orig": "was necessary to combine all available data into one homog-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 164, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 665.245, "r_x1": 545.115, "r_y1": 665.245, "r_x2": 545.115, "r_y2": 656.693, "r_x3": 308.862, "r_y3": 656.693, "coord_origin": "TOPLEFT"}, "text": "enized dataset before we could train our models for practi-", "orig": "enized dataset before we could train our models for practi-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 165, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 677.201, "r_x1": 361.245, "r_y1": 677.201, "r_x2": 361.245, "r_y2": 668.649, "r_x3": 308.862, "r_y3": 668.649, "coord_origin": "TOPLEFT"}, "text": "cal purposes.", "orig": "cal purposes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 166, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 365.44, "r_y0": 677.201, "r_x1": 545.115, "r_y1": 677.201, "r_x2": 545.115, "r_y2": 668.649, "r_x3": 365.44, "r_y3": 668.649, "coord_origin": "TOPLEFT"}, "text": "Given the size of PubTabNet, we adopted its", "orig": "Given the size of PubTabNet, we adopted its", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 167, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 689.156, "r_x1": 545.115, "r_y1": 689.156, "r_x2": 545.115, "r_y2": 680.604, "r_x3": 308.862, "r_y3": 680.604, "coord_origin": "TOPLEFT"}, "text": "annotation format and we extracted and converted all tables", "orig": "annotation format and we extracted and converted all tables", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 168, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 701.111, "r_x1": 487.322, "r_y1": 701.111, "r_x2": 487.322, "r_y2": 692.559, "r_x3": 308.862, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "as PNG images with a resolution of 72 dpi.", "orig": "as PNG images with a resolution of 72 dpi.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 169, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 492.901, "r_y0": 701.111, "r_x1": 545.115, "r_y1": 701.111, "r_x2": 545.115, "r_y2": 692.559, "r_x3": 492.901, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "Additionally,", "orig": "Additionally,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 170, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 713.066, "r_x1": 545.115, "r_y1": 713.066, "r_x2": 545.115, "r_y2": 704.514, "r_x3": 308.862, "r_y3": 704.514, "coord_origin": "TOPLEFT"}, "text": "we have filtered out tables with extreme sizes due to small", "orig": "we have filtered out tables with extreme sizes due to small", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 171, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 295.121, "r_y0": 742.954, "r_x1": 300.102, "r_y1": 742.954, "r_x2": 300.102, "r_y2": 734.402, "r_x3": 295.121, "r_y3": 734.402, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "parsed_page": null, "predictions": {"layout": {"clusters": [{"id": 10, "label": "text", "bbox": {"l": 50.112, "t": 75.47699999999998, "r": 250.151, "b": 84.029, "coord_origin": "TOPLEFT"}, "confidence": 0.8767216801643372, "cells": [{"index": 0, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 84.029, "r_x1": 250.151, "r_y1": 84.029, "r_x2": 250.151, "r_y2": 75.47699999999998, "r_x3": 50.112, "r_y3": 75.47699999999998, "coord_origin": "TOPLEFT"}, "text": "tag-decoder which is constrained to the table-tags.", "orig": "tag-decoder which is constrained to the table-tags.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 5, "label": "text", "bbox": {"l": 50.112, "t": 87.48800000000006, "r": 286.365, "b": 275.36800000000005, "coord_origin": "TOPLEFT"}, "confidence": 0.9822593927383423, "cells": [{"index": 1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 96.03999999999996, "r_x1": 70.366, "r_y1": 96.03999999999996, "r_x2": 70.366, "r_y2": 87.48800000000006, "r_x3": 62.067, "r_y3": 87.48800000000006, "coord_origin": "TOPLEFT"}, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 76.931, "r_y0": 96.03999999999996, "r_x1": 110.953, "r_y1": 96.03999999999996, "r_x2": 110.953, "r_y2": 87.48800000000006, "r_x3": 76.931, "r_y3": 87.48800000000006, "coord_origin": "TOPLEFT"}, "text": "practice,", "orig": "practice,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 118.545, "r_y0": 96.03999999999996, "r_x1": 136.258, "r_y1": 96.03999999999996, "r_x2": 136.258, "r_y2": 87.48800000000006, "r_x3": 118.545, "r_y3": 87.48800000000006, "coord_origin": "TOPLEFT"}, "text": "both", "orig": "both", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 142.824, "r_y0": 96.03999999999996, "r_x1": 175.372, "r_y1": 96.03999999999996, "r_x2": 175.372, "r_y2": 87.48800000000006, "r_x3": 142.824, "r_y3": 87.48800000000006, "coord_origin": "TOPLEFT"}, "text": "network", "orig": "network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 181.947, "r_y0": 96.03999999999996, "r_x1": 232.836, "r_y1": 96.03999999999996, "r_x2": 232.836, "r_y2": 87.48800000000006, "r_x3": 181.947, "r_y3": 87.48800000000006, "coord_origin": "TOPLEFT"}, "text": "architectures", "orig": "architectures", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 239.411, "r_y0": 96.03999999999996, "r_x1": 265.414, "r_y1": 96.03999999999996, "r_x2": 265.414, "r_y2": 87.48800000000006, "r_x3": 239.411, "r_y3": 87.48800000000006, "coord_origin": "TOPLEFT"}, "text": "(IETD", "orig": "(IETD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 271.979, "r_y0": 96.03999999999996, "r_x1": 286.365, "r_y1": 96.03999999999996, "r_x2": 286.365, "r_y2": 87.48800000000006, "r_x3": 271.979, "r_y3": 87.48800000000006, "coord_origin": "TOPLEFT"}, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 107.995, "r_x1": 286.365, "r_y1": 107.995, "r_x2": 286.365, "r_y2": 99.44299999999998, "r_x3": 50.112, "r_y3": 99.44299999999998, "coord_origin": "TOPLEFT"}, "text": "IEDD) require an implicit, custom trained object-character-", "orig": "IEDD) require an implicit, custom trained object-character-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 119.95100000000002, "r_x1": 286.365, "r_y1": 119.95100000000002, "r_x2": 286.365, "r_y2": 111.399, "r_x3": 50.112, "r_y3": 111.399, "coord_origin": "TOPLEFT"}, "text": "recognition (OCR) to obtain the content of the table-cells.", "orig": "recognition (OCR) to obtain the content of the table-cells.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 131.90599999999995, "r_x1": 286.365, "r_y1": 131.90599999999995, "r_x2": 286.365, "r_y2": 123.35400000000004, "r_x3": 50.112, "r_y3": 123.35400000000004, "coord_origin": "TOPLEFT"}, "text": "In the case of IETD, this OCR engine is implicit in the de-", "orig": "In the case of IETD, this OCR engine is implicit in the de-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 143.861, "r_x1": 286.365, "r_y1": 143.861, "r_x2": 286.365, "r_y2": 135.30899999999997, "r_x3": 50.112, "r_y3": 135.30899999999997, "coord_origin": "TOPLEFT"}, "text": "coder similar to [24]. For the IEDD, the OCR is solely em-", "orig": "coder similar to [24]. For the IEDD, the OCR is solely em-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 155.81600000000003, "r_x1": 174.206, "r_y1": 155.81600000000003, "r_x2": 174.206, "r_y2": 147.264, "r_x3": 50.112, "r_y3": 147.264, "coord_origin": "TOPLEFT"}, "text": "bedded in the content-decoder.", "orig": "bedded in the content-decoder.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 179.098, "r_y0": 155.81600000000003, "r_x1": 286.365, "r_y1": 155.81600000000003, "r_x2": 286.365, "r_y2": 147.264, "r_x3": 179.098, "r_y3": 147.264, "coord_origin": "TOPLEFT"}, "text": "This reliance on a custom,", "orig": "This reliance on a custom,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 167.77099999999996, "r_x1": 243.267, "r_y1": 167.77099999999996, "r_x2": 243.267, "r_y2": 159.21900000000005, "r_x3": 50.112, "r_y3": 159.21900000000005, "coord_origin": "TOPLEFT"}, "text": "implicit OCR decoder is of course problematic.", "orig": "implicit OCR decoder is of course problematic.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 248.437, "r_y0": 167.77099999999996, "r_x1": 286.365, "r_y1": 167.77099999999996, "r_x2": 286.365, "r_y2": 159.21900000000005, "r_x3": 248.437, "r_y3": 159.21900000000005, "coord_origin": "TOPLEFT"}, "text": "OCR is a", "orig": "OCR is a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 179.726, "r_x1": 286.365, "r_y1": 179.726, "r_x2": 286.365, "r_y2": 171.17399999999998, "r_x3": 50.112, "r_y3": 171.17399999999998, "coord_origin": "TOPLEFT"}, "text": "well known and extremely tough problem, that often needs", "orig": "well known and extremely tough problem, that often needs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 191.68200000000002, "r_x1": 286.365, "r_y1": 191.68200000000002, "r_x2": 286.365, "r_y2": 183.13, "r_x3": 50.112, "r_y3": 183.13, "coord_origin": "TOPLEFT"}, "text": "custom training for each individual language. However, the", "orig": "custom training for each individual language. However, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 203.63699999999994, "r_x1": 126.655, "r_y1": 203.63699999999994, "r_x2": 126.655, "r_y2": 195.08500000000004, "r_x3": 50.112, "r_y3": 195.08500000000004, "coord_origin": "TOPLEFT"}, "text": "limited availability", "orig": "limited availability", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 19, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 130.59, "r_y0": 203.63699999999994, "r_x1": 142.206, "r_y1": 203.63699999999994, "r_x2": 142.206, "r_y2": 195.08500000000004, "r_x3": 130.59, "r_y3": 195.08500000000004, "coord_origin": "TOPLEFT"}, "text": "for", "orig": "for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 20, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 146.132, "r_y0": 203.63699999999994, "r_x1": 286.365, "r_y1": 203.63699999999994, "r_x2": 286.365, "r_y2": 195.08500000000004, "r_x3": 146.132, "r_y3": 195.08500000000004, "coord_origin": "TOPLEFT"}, "text": "non-english content in the current", "orig": "non-english content in the current", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 21, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 215.59199999999998, "r_x1": 286.365, "r_y1": 215.59199999999998, "r_x2": 286.365, "r_y2": 207.03999999999996, "r_x3": 50.112, "r_y3": 207.03999999999996, "coord_origin": "TOPLEFT"}, "text": "datasets, makes it impractical to apply the IETD and IEDD", "orig": "datasets, makes it impractical to apply the IETD and IEDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 22, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 227.54700000000003, "r_x1": 286.365, "r_y1": 227.54700000000003, "r_x2": 286.365, "r_y2": 218.995, "r_x3": 50.112, "r_y3": 218.995, "coord_origin": "TOPLEFT"}, "text": "methods on tables with other languages. Additionally, OCR", "orig": "methods on tables with other languages. Additionally, OCR", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 23, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 239.50199999999995, "r_x1": 286.365, "r_y1": 239.50199999999995, "r_x2": 286.365, "r_y2": 230.95000000000005, "r_x3": 50.112, "r_y3": 230.95000000000005, "coord_origin": "TOPLEFT"}, "text": "can be completely omitted if the tables originate from pro-", "orig": "can be completely omitted if the tables originate from pro-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 24, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 251.457, "r_x1": 286.365, "r_y1": 251.457, "r_x2": 286.365, "r_y2": 242.90499999999997, "r_x3": 50.112, "r_y3": 242.90499999999997, "coord_origin": "TOPLEFT"}, "text": "grammatic PDF documents with known positions of each", "orig": "grammatic PDF documents with known positions of each", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 25, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 263.413, "r_x1": 66.989, "r_y1": 263.413, "r_x2": 66.989, "r_y2": 254.861, "r_x3": 50.112, "r_y3": 254.861, "coord_origin": "TOPLEFT"}, "text": "cell.", "orig": "cell.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 26, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 71.382, "r_y0": 263.413, "r_x1": 286.365, "r_y1": 263.413, "r_x2": 286.365, "r_y2": 254.861, "r_x3": 71.382, "r_y3": 254.861, "coord_origin": "TOPLEFT"}, "text": "The latter was the inspiration for the work of this pa-", "orig": "The latter was the inspiration for the work of this pa-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 27, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 275.36800000000005, "r_x1": 64.777, "r_y1": 275.36800000000005, "r_x2": 64.777, "r_y2": 266.81600000000003, "r_x3": 50.112, "r_y3": 266.81600000000003, "coord_origin": "TOPLEFT"}, "text": "per.", "orig": "per.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 0, "label": "text", "bbox": {"l": 50.112, "t": 278.43899999999996, "r": 286.365, "b": 490.617, "coord_origin": "TOPLEFT"}, "confidence": 0.9878450036048889, "cells": [{"index": 28, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 287.395, "r_x1": 90.301, "r_y1": 287.395, "r_x2": 90.301, "r_y2": 278.43899999999996, "r_x3": 62.067, "r_y3": 278.43899999999996, "coord_origin": "TOPLEFT"}, "text": "Graph", "orig": "Graph", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 29, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 96.677, "r_y0": 287.395, "r_x1": 126.007, "r_y1": 287.395, "r_x2": 126.007, "r_y2": 278.43899999999996, "r_x3": 96.677, "r_y3": 278.43899999999996, "coord_origin": "TOPLEFT"}, "text": "Neural", "orig": "Neural", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 30, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 132.373, "r_y0": 287.395, "r_x1": 171.566, "r_y1": 287.395, "r_x2": 171.566, "r_y2": 278.43899999999996, "r_x3": 132.373, "r_y3": 278.43899999999996, "coord_origin": "TOPLEFT"}, "text": "networks", "orig": "networks", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 171.568, "r_y0": 287.379, "r_x1": 174.338, "r_y1": 287.379, "r_x2": 174.338, "r_y2": 278.827, "r_x3": 171.568, "r_y3": 278.827, "coord_origin": "TOPLEFT"}, "text": ":", "orig": ":", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 185.187, "r_y0": 287.379, "r_x1": 210.083, "r_y1": 287.379, "r_x2": 210.083, "r_y2": 278.827, "r_x3": 185.187, "r_y3": 278.827, "coord_origin": "TOPLEFT"}, "text": "Graph", "orig": "Graph", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 216.459, "r_y0": 287.379, "r_x1": 243.568, "r_y1": 287.379, "r_x2": 243.568, "r_y2": 278.827, "r_x3": 216.459, "r_y3": 278.827, "coord_origin": "TOPLEFT"}, "text": "Neural", "orig": "Neural", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 249.944, "r_y0": 287.379, "r_x1": 286.357, "r_y1": 287.379, "r_x2": 286.357, "r_y2": 278.827, "r_x3": 249.944, "r_y3": 278.827, "coord_origin": "TOPLEFT"}, "text": "networks", "orig": "networks", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 299.335, "r_x1": 84.971, "r_y1": 299.335, "r_x2": 84.971, "r_y2": 290.783, "r_x3": 50.112, "r_y3": 290.783, "coord_origin": "TOPLEFT"}, "text": "(GNN's)", "orig": "(GNN's)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 91.347, "r_y0": 299.335, "r_x1": 107.845, "r_y1": 299.335, "r_x2": 107.845, "r_y2": 290.783, "r_x3": 91.347, "r_y3": 290.783, "coord_origin": "TOPLEFT"}, "text": "take", "orig": "take", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 114.211, "r_y0": 299.335, "r_x1": 118.635, "r_y1": 299.335, "r_x2": 118.635, "r_y2": 290.783, "r_x3": 114.211, "r_y3": 290.783, "coord_origin": "TOPLEFT"}, "text": "a", "orig": "a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 125.011, "r_y0": 299.335, "r_x1": 159.87, "r_y1": 299.335, "r_x2": 159.87, "r_y2": 290.783, "r_x3": 125.011, "r_y3": 290.783, "coord_origin": "TOPLEFT"}, "text": "radically", "orig": "radically", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 166.246, "r_y0": 299.335, "r_x1": 200.298, "r_y1": 299.335, "r_x2": 200.298, "r_y2": 290.783, "r_x3": 166.246, "r_y3": 290.783, "coord_origin": "TOPLEFT"}, "text": "different", "orig": "different", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 206.664, "r_y0": 299.335, "r_x1": 243.177, "r_y1": 299.335, "r_x2": 243.177, "r_y2": 290.783, "r_x3": 206.664, "r_y3": 290.783, "coord_origin": "TOPLEFT"}, "text": "approach", "orig": "approach", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 249.553, "r_y0": 299.335, "r_x1": 257.304, "r_y1": 299.335, "r_x2": 257.304, "r_y2": 290.783, "r_x3": 249.553, "r_y3": 290.783, "coord_origin": "TOPLEFT"}, "text": "to", "orig": "to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 263.68, "r_y0": 299.335, "r_x1": 286.365, "r_y1": 299.335, "r_x2": 286.365, "r_y2": 290.783, "r_x3": 263.68, "r_y3": 290.783, "coord_origin": "TOPLEFT"}, "text": "table-", "orig": "table-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 311.29, "r_x1": 84.971, "r_y1": 311.29, "r_x2": 84.971, "r_y2": 302.738, "r_x3": 50.112, "r_y3": 302.738, "coord_origin": "TOPLEFT"}, "text": "structure", "orig": "structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 88.986, "r_y0": 311.29, "r_x1": 131.168, "r_y1": 311.29, "r_x2": 131.168, "r_y2": 302.738, "r_x3": 88.986, "r_y3": 302.738, "coord_origin": "TOPLEFT"}, "text": "extraction.", "orig": "extraction.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 138.849, "r_y0": 311.29, "r_x1": 286.365, "r_y1": 311.29, "r_x2": 286.365, "r_y2": 302.738, "r_x3": 138.849, "r_y3": 302.738, "coord_origin": "TOPLEFT"}, "text": "Note that one table cell can consti-", "orig": "Note that one table cell can consti-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 323.245, "r_x1": 286.365, "r_y1": 323.245, "r_x2": 286.365, "r_y2": 314.693, "r_x3": 50.112, "r_y3": 314.693, "coord_origin": "TOPLEFT"}, "text": "tute out of multiple text-cells. To obtain the table-structure,", "orig": "tute out of multiple text-cells. To obtain the table-structure,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 335.2, "r_x1": 136.996, "r_y1": 335.2, "r_x2": 136.996, "r_y2": 326.648, "r_x3": 50.112, "r_y3": 326.648, "coord_origin": "TOPLEFT"}, "text": "one creates an initial", "orig": "one creates an initial", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 48, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 141.051, "r_y0": 335.2, "r_x1": 166.226, "r_y1": 335.2, "r_x2": 166.226, "r_y2": 326.648, "r_x3": 141.051, "r_y3": 326.648, "coord_origin": "TOPLEFT"}, "text": "graph,", "orig": "graph,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 49, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 170.679, "r_y0": 335.2, "r_x1": 286.365, "r_y1": 335.2, "r_x2": 286.365, "r_y2": 326.648, "r_x3": 170.679, "r_y3": 326.648, "coord_origin": "TOPLEFT"}, "text": "where each of the text-cells", "orig": "where each of the text-cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 50, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 347.155, "r_x1": 260.442, "r_y1": 347.155, "r_x2": 260.442, "r_y2": 338.603, "r_x3": 50.112, "r_y3": 338.603, "coord_origin": "TOPLEFT"}, "text": "becomes a node in the graph similar to [33, 34, 2].", "orig": "becomes a node in the graph similar to [33, 34, 2].", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 51, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 266.45, "r_y0": 347.155, "r_x1": 286.365, "r_y1": 347.155, "r_x2": 286.365, "r_y2": 338.603, "r_x3": 266.45, "r_y3": 338.603, "coord_origin": "TOPLEFT"}, "text": "Each", "orig": "Each", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 52, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 359.11, "r_x1": 286.365, "r_y1": 359.11, "r_x2": 286.365, "r_y2": 350.558, "r_x3": 50.112, "r_y3": 350.558, "coord_origin": "TOPLEFT"}, "text": "node is then associated with en embedding vector coming", "orig": "node is then associated with en embedding vector coming", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 53, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 371.066, "r_x1": 286.365, "r_y1": 371.066, "r_x2": 286.365, "r_y2": 362.514, "r_x3": 50.112, "r_y3": 362.514, "coord_origin": "TOPLEFT"}, "text": "from the encoded image, its coordinates and the encoded", "orig": "from the encoded image, its coordinates and the encoded", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 54, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 383.021, "r_x1": 67.397, "r_y1": 383.021, "r_x2": 67.397, "r_y2": 374.469, "r_x3": 50.112, "r_y3": 374.469, "coord_origin": "TOPLEFT"}, "text": "text.", "orig": "text.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 55, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 72.976, "r_y0": 383.021, "r_x1": 286.365, "r_y1": 383.021, "r_x2": 286.365, "r_y2": 374.469, "r_x3": 72.976, "r_y3": 374.469, "coord_origin": "TOPLEFT"}, "text": "Furthermore, nodes that represent adjacent text-cells", "orig": "Furthermore, nodes that represent adjacent text-cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 56, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 394.976, "r_x1": 92.602, "r_y1": 394.976, "r_x2": 92.602, "r_y2": 386.424, "r_x3": 50.112, "r_y3": 386.424, "coord_origin": "TOPLEFT"}, "text": "are linked.", "orig": "are linked.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 57, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 97.305, "r_y0": 394.976, "r_x1": 286.365, "r_y1": 394.976, "r_x2": 286.365, "r_y2": 386.424, "r_x3": 97.305, "r_y3": 386.424, "coord_origin": "TOPLEFT"}, "text": "Graph Convolutional Networks (GCN's) based", "orig": "Graph Convolutional Networks (GCN's) based", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 58, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 406.931, "r_x1": 286.365, "r_y1": 406.931, "r_x2": 286.365, "r_y2": 398.379, "r_x3": 50.112, "r_y3": 398.379, "coord_origin": "TOPLEFT"}, "text": "methods take the image as an input, but also the position of", "orig": "methods take the image as an input, but also the position of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 59, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 418.886, "r_x1": 286.365, "r_y1": 418.886, "r_x2": 286.365, "r_y2": 410.334, "r_x3": 50.112, "r_y3": 410.334, "coord_origin": "TOPLEFT"}, "text": "the text-cells and their content [18]. The purpose of a GCN", "orig": "the text-cells and their content [18]. The purpose of a GCN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 60, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 430.841, "r_x1": 286.365, "r_y1": 430.841, "r_x2": 286.365, "r_y2": 422.289, "r_x3": 50.112, "r_y3": 422.289, "coord_origin": "TOPLEFT"}, "text": "is to transform the input graph into a new graph, which re-", "orig": "is to transform the input graph into a new graph, which re-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 61, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 442.797, "r_x1": 198.236, "r_y1": 442.797, "r_x2": 198.236, "r_y2": 434.245, "r_x3": 50.112, "r_y3": 434.245, "coord_origin": "TOPLEFT"}, "text": "places the old links with new ones.", "orig": "places the old links with new ones.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 62, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 205.927, "r_y0": 442.797, "r_x1": 286.365, "r_y1": 442.797, "r_x2": 286.365, "r_y2": 434.245, "r_x3": 205.927, "r_y3": 434.245, "coord_origin": "TOPLEFT"}, "text": "The new links then", "orig": "The new links then", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 63, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 454.752, "r_x1": 165.618, "r_y1": 454.752, "r_x2": 165.618, "r_y2": 446.2, "r_x3": 50.112, "r_y3": 446.2, "coord_origin": "TOPLEFT"}, "text": "represent the table-structure.", "orig": "represent the table-structure.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 64, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 171.417, "r_y0": 454.752, "r_x1": 286.365, "r_y1": 454.752, "r_x2": 286.365, "r_y2": 446.2, "r_x3": 171.417, "r_y3": 446.2, "coord_origin": "TOPLEFT"}, "text": "With this approach, one can", "orig": "With this approach, one can", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 65, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 466.707, "r_x1": 242.36, "r_y1": 466.707, "r_x2": 242.36, "r_y2": 458.155, "r_x3": 50.112, "r_y3": 458.155, "coord_origin": "TOPLEFT"}, "text": "avoid the need to build custom OCR decoders.", "orig": "avoid the need to build custom OCR decoders.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 66, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 248.408, "r_y0": 466.707, "r_x1": 286.365, "r_y1": 466.707, "r_x2": 286.365, "r_y2": 458.155, "r_x3": 248.408, "r_y3": 458.155, "coord_origin": "TOPLEFT"}, "text": "However,", "orig": "However,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 67, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 478.662, "r_x1": 286.365, "r_y1": 478.662, "r_x2": 286.365, "r_y2": 470.11, "r_x3": 50.112, "r_y3": 470.11, "coord_origin": "TOPLEFT"}, "text": "the quality of the reconstructed structure is not comparable", "orig": "the quality of the reconstructed structure is not comparable", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 68, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 490.617, "r_x1": 186.5, "r_y1": 490.617, "r_x2": 186.5, "r_y2": 482.065, "r_x3": 50.112, "r_y3": 482.065, "coord_origin": "TOPLEFT"}, "text": "to the current state-of-the-art [18].", "orig": "to the current state-of-the-art [18].", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 1, "label": "text", "bbox": {"l": 50.112, "t": 493.689, "r": 286.366, "b": 622.181, "coord_origin": "TOPLEFT"}, "confidence": 0.9875094294548035, "cells": [{"index": 69, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 502.645, "r_x1": 252.881, "r_y1": 502.645, "r_x2": 252.881, "r_y2": 493.689, "r_x3": 62.067, "r_y3": 493.689, "coord_origin": "TOPLEFT"}, "text": "Hybrid Deep Learning-Rule-Based approach", "orig": "Hybrid Deep Learning-Rule-Based approach", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 70, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 252.882, "r_y0": 502.629, "r_x1": 255.652, "r_y1": 502.629, "r_x2": 255.652, "r_y2": 494.077, "r_x3": 252.882, "r_y3": 494.077, "coord_origin": "TOPLEFT"}, "text": ":", "orig": ":", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 71, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 258.63, "r_y0": 502.629, "r_x1": 286.366, "r_y1": 502.629, "r_x2": 286.366, "r_y2": 494.077, "r_x3": 258.63, "r_y3": 494.077, "coord_origin": "TOPLEFT"}, "text": "Apop-", "orig": "Apop-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 72, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 514.5840000000001, "r_x1": 286.365, "r_y1": 514.5840000000001, "r_x2": 286.365, "r_y2": 506.032, "r_x3": 50.112, "r_y3": 506.032, "coord_origin": "TOPLEFT"}, "text": "ular current model for table-structure identification is the", "orig": "ular current model for table-structure identification is the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 73, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 526.539, "r_x1": 286.365, "r_y1": 526.539, "r_x2": 286.365, "r_y2": 517.9870000000001, "r_x3": 50.112, "r_y3": 517.9870000000001, "coord_origin": "TOPLEFT"}, "text": "use of a hybrid Deep Learning-Rule-Based approach similar", "orig": "use of a hybrid Deep Learning-Rule-Based approach similar", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 74, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 538.494, "r_x1": 286.365, "r_y1": 538.494, "r_x2": 286.365, "r_y2": 529.942, "r_x3": 50.112, "r_y3": 529.942, "coord_origin": "TOPLEFT"}, "text": "to [27, 29]. In this approach, one first detects the position of", "orig": "to [27, 29]. In this approach, one first detects the position of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 75, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 550.45, "r_x1": 286.365, "r_y1": 550.45, "r_x2": 286.365, "r_y2": 541.898, "r_x3": 50.112, "r_y3": 541.898, "coord_origin": "TOPLEFT"}, "text": "the table-cells with object detection (e.g. YoloVx or Mask-", "orig": "the table-cells with object detection (e.g. YoloVx or Mask-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 76, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 562.405, "r_x1": 286.365, "r_y1": 562.405, "r_x2": 286.365, "r_y2": 553.8530000000001, "r_x3": 50.112, "r_y3": 553.8530000000001, "coord_origin": "TOPLEFT"}, "text": "RCNN), then classifies the table into different types (from", "orig": "RCNN), then classifies the table into different types (from", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 77, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 574.36, "r_x1": 59.527, "r_y1": 574.36, "r_x2": 59.527, "r_y2": 565.808, "r_x3": 50.112, "r_y3": 565.808, "coord_origin": "TOPLEFT"}, "text": "its", "orig": "its", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 78, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 64.259, "r_y0": 574.36, "r_x1": 95.8, "r_y1": 574.36, "r_x2": 95.8, "r_y2": 565.808, "r_x3": 64.259, "r_y3": 565.808, "coord_origin": "TOPLEFT"}, "text": "images)", "orig": "images)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 79, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 100.523, "r_y0": 574.36, "r_x1": 145.105, "r_y1": 574.36, "r_x2": 145.105, "r_y2": 565.808, "r_x3": 100.523, "r_y3": 565.808, "coord_origin": "TOPLEFT"}, "text": "and finally", "orig": "and finally", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 80, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 149.828, "r_y0": 574.36, "r_x1": 166.983, "r_y1": 574.36, "r_x2": 166.983, "r_y2": 565.808, "r_x3": 149.828, "r_y3": 565.808, "coord_origin": "TOPLEFT"}, "text": "uses", "orig": "uses", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 81, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 171.715, "r_y0": 574.36, "r_x1": 205.768, "r_y1": 574.36, "r_x2": 205.768, "r_y2": 565.808, "r_x3": 171.715, "r_y3": 565.808, "coord_origin": "TOPLEFT"}, "text": "different", "orig": "different", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 82, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 210.5, "r_y0": 574.36, "r_x1": 244.243, "r_y1": 574.36, "r_x2": 244.243, "r_y2": 565.808, "r_x3": 210.5, "r_y3": 565.808, "coord_origin": "TOPLEFT"}, "text": "rule-sets", "orig": "rule-sets", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 83, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 248.975, "r_y0": 574.36, "r_x1": 256.726, "r_y1": 574.36, "r_x2": 256.726, "r_y2": 565.808, "r_x3": 248.975, "r_y3": 565.808, "coord_origin": "TOPLEFT"}, "text": "to", "orig": "to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 84, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 261.459, "r_y0": 574.36, "r_x1": 286.365, "r_y1": 574.36, "r_x2": 286.365, "r_y2": 565.808, "r_x3": 261.459, "r_y3": 565.808, "coord_origin": "TOPLEFT"}, "text": "obtain", "orig": "obtain", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 85, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 586.315, "r_x1": 122.64, "r_y1": 586.315, "r_x2": 122.64, "r_y2": 577.763, "r_x3": 50.112, "r_y3": 577.763, "coord_origin": "TOPLEFT"}, "text": "its table-structure.", "orig": "its table-structure.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 86, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 127.482, "r_y0": 586.315, "r_x1": 286.365, "r_y1": 586.315, "r_x2": 286.365, "r_y2": 577.763, "r_x3": 127.482, "r_y3": 577.763, "coord_origin": "TOPLEFT"}, "text": "Currently, this approach achieves state-", "orig": "Currently, this approach achieves state-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 87, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 598.27, "r_x1": 87.731, "r_y1": 598.27, "r_x2": 87.731, "r_y2": 589.718, "r_x3": 50.112, "r_y3": 589.718, "coord_origin": "TOPLEFT"}, "text": "of-the-art", "orig": "of-the-art", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 88, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 92.074, "r_y0": 598.27, "r_x1": 120.577, "r_y1": 598.27, "r_x2": 120.577, "r_y2": 589.718, "r_x3": 92.074, "r_y3": 589.718, "coord_origin": "TOPLEFT"}, "text": "results,", "orig": "results,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 89, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 125.389, "r_y0": 598.27, "r_x1": 137.922, "r_y1": 598.27, "r_x2": 137.922, "r_y2": 589.718, "r_x3": 125.389, "r_y3": 589.718, "coord_origin": "TOPLEFT"}, "text": "but", "orig": "but", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 90, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 142.266, "r_y0": 598.27, "r_x1": 148.911, "r_y1": 598.27, "r_x2": 148.911, "r_y2": 589.718, "r_x3": 142.266, "r_y3": 589.718, "coord_origin": "TOPLEFT"}, "text": "is", "orig": "is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 91, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 153.255, "r_y0": 598.27, "r_x1": 165.987, "r_y1": 598.27, "r_x2": 165.987, "r_y2": 589.718, "r_x3": 153.255, "r_y3": 589.718, "coord_origin": "TOPLEFT"}, "text": "not", "orig": "not", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 92, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 170.331, "r_y0": 598.27, "r_x1": 286.365, "r_y1": 598.27, "r_x2": 286.365, "r_y2": 589.718, "r_x3": 170.331, "r_y3": 589.718, "coord_origin": "TOPLEFT"}, "text": "an end-to-end deep-learning", "orig": "an end-to-end deep-learning", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 93, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 610.225, "r_x1": 82.49, "r_y1": 610.225, "r_x2": 82.49, "r_y2": 601.673, "r_x3": 50.112, "r_y3": 601.673, "coord_origin": "TOPLEFT"}, "text": "method.", "orig": "method.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 94, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 87.173, "r_y0": 610.225, "r_x1": 286.365, "r_y1": 610.225, "r_x2": 286.365, "r_y2": 601.673, "r_x3": 87.173, "r_y3": 601.673, "coord_origin": "TOPLEFT"}, "text": "As such, new rules need to be written if different", "orig": "As such, new rules need to be written if different", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 95, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 622.181, "r_x1": 175.989, "r_y1": 622.181, "r_x2": 175.989, "r_y2": 613.629, "r_x3": 50.112, "r_y3": 613.629, "coord_origin": "TOPLEFT"}, "text": "types of tables are encountered.", "orig": "types of tables are encountered.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 8, "label": "section_header", "bbox": {"l": 50.112, "t": 635.9449999999999, "r": 105.225, "b": 646.693, "coord_origin": "TOPLEFT"}, "confidence": 0.9423062205314636, "cells": [{"index": 96, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 646.693, "r_x1": 105.225, "r_y1": 646.693, "r_x2": 105.225, "r_y2": 635.9449999999999, "r_x3": 50.112, "r_y3": 635.9449999999999, "coord_origin": "TOPLEFT"}, "text": "3. Datasets", "orig": "3. Datasets", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 3, "label": "text", "bbox": {"l": 50.112, "t": 656.694, "r": 286.365, "b": 713.066, "coord_origin": "TOPLEFT"}, "confidence": 0.9862047433853149, "cells": [{"index": 97, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 665.246, "r_x1": 286.365, "r_y1": 665.246, "r_x2": 286.365, "r_y2": 656.694, "r_x3": 62.067, "r_y3": 656.694, "coord_origin": "TOPLEFT"}, "text": "We rely on large-scale datasets such as PubTabNet [37],", "orig": "We rely on large-scale datasets such as PubTabNet [37],", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 98, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 677.201, "r_x1": 286.365, "r_y1": 677.201, "r_x2": 286.365, "r_y2": 668.649, "r_x3": 50.112, "r_y3": 668.649, "coord_origin": "TOPLEFT"}, "text": "FinTabNet [36], and TableBank [17] datasets to train and", "orig": "FinTabNet [36], and TableBank [17] datasets to train and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 99, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 689.156, "r_x1": 133.479, "r_y1": 689.156, "r_x2": 133.479, "r_y2": 680.604, "r_x3": 50.112, "r_y3": 680.604, "coord_origin": "TOPLEFT"}, "text": "evaluate our models.", "orig": "evaluate our models.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 100, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 138.271, "r_y0": 689.156, "r_x1": 286.365, "r_y1": 689.156, "r_x2": 286.365, "r_y2": 680.604, "r_x3": 138.271, "r_y3": 680.604, "coord_origin": "TOPLEFT"}, "text": "These datasets span over various ap-", "orig": "These datasets span over various ap-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 101, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 701.111, "r_x1": 166.246, "r_y1": 701.111, "r_x2": 166.246, "r_y2": 692.559, "r_x3": 50.112, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "pearance styles and content.", "orig": "pearance styles and content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 102, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 173.688, "r_y0": 701.111, "r_x1": 286.365, "r_y1": 701.111, "r_x2": 286.365, "r_y2": 692.559, "r_x3": 173.688, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "We also introduce our own", "orig": "We also introduce our own", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 103, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 713.066, "r_x1": 286.365, "r_y1": 713.066, "r_x2": 286.365, "r_y2": 704.514, "r_x3": 50.112, "r_y3": 704.514, "coord_origin": "TOPLEFT"}, "text": "synthetically generated SynthTabNet dataset to fix an im-", "orig": "synthetically generated SynthTabNet dataset to fix an im-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 6, "label": "picture", "bbox": {"l": 312.10369873046875, "t": 78.44086456298828, "r": 550.38916015625, "b": 250.60984802246094, "coord_origin": "TOPLEFT"}, "confidence": 0.9746918082237244, "cells": [{"index": 104, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 380.799, "r_y0": 88.46699999999998, "r_x1": 486.849, "r_y1": 88.46699999999998, "r_x2": 486.849, "r_y2": 80.154, "r_x3": 380.799, "r_y3": 80.154, "coord_origin": "TOPLEFT"}, "text": "PubTabNet + FinTabNet", "orig": "PubTabNet + FinTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 105, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 396.768, "r_y0": 250.68200000000002, "r_x1": 469.787, "r_y1": 250.68200000000002, "r_x2": 469.787, "r_y2": 242.36900000000003, "r_x3": 396.768, "r_y3": 242.36900000000003, "coord_origin": "TOPLEFT"}, "text": "Rows / Columns", "orig": "Rows / Columns", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 106, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.977, "r_y0": 239.19299999999998, "r_x1": 324.793, "r_y1": 239.19299999999998, "r_x2": 324.793, "r_y2": 233.65099999999995, "r_x3": 320.977, "r_y3": 233.65099999999995, "coord_origin": "TOPLEFT"}, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 107, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 410.483, "r_y0": 239.19299999999998, "r_x1": 418.113, "r_y1": 239.19299999999998, "r_x2": 418.113, "r_y2": 233.65099999999995, "r_x3": 410.483, "r_y3": 233.65099999999995, "coord_origin": "TOPLEFT"}, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 108, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 500.85, "r_y0": 239.19299999999998, "r_x1": 508.48, "r_y1": 239.19299999999998, "r_x2": 508.48, "r_y2": 233.65099999999995, "r_x3": 500.85, "r_y3": 233.65099999999995, "coord_origin": "TOPLEFT"}, "text": "40", "orig": "40", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 109, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 365.3, "r_y0": 239.19299999999998, "r_x1": 372.93, "r_y1": 239.19299999999998, "r_x2": 372.93, "r_y2": 233.65099999999995, "r_x3": 365.3, "r_y3": 233.65099999999995, "coord_origin": "TOPLEFT"}, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 110, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 455.666, "r_y0": 239.19299999999998, "r_x1": 463.296, "r_y1": 239.19299999999998, "r_x2": 463.296, "r_y2": 233.65099999999995, "r_x3": 455.666, "r_y3": 233.65099999999995, "coord_origin": "TOPLEFT"}, "text": "30", "orig": "30", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 111, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 542.035, "r_y0": 239.19299999999998, "r_x1": 549.665, "r_y1": 239.19299999999998, "r_x2": 549.665, "r_y2": 233.65099999999995, "r_x3": 542.035, "r_y3": 233.65099999999995, "coord_origin": "TOPLEFT"}, "text": "50", "orig": "50", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 112, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 316.045, "r_y0": 236.21699999999998, "r_x1": 319.861, "r_y1": 236.21699999999998, "r_x2": 319.861, "r_y2": 230.67399999999998, "r_x3": 316.045, "r_y3": 230.67399999999998, "coord_origin": "TOPLEFT"}, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 113, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 312.625, "r_y0": 204.461, "r_x1": 320.255, "r_y1": 204.461, "r_x2": 320.255, "r_y2": 198.91899999999998, "r_x3": 312.625, "r_y3": 198.91899999999998, "coord_origin": "TOPLEFT"}, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 114, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 313.15, "r_y0": 173.86800000000005, "r_x1": 320.78, "r_y1": 173.86800000000005, "r_x2": 320.78, "r_y2": 168.32600000000002, "r_x3": 313.15, "r_y3": 168.32600000000002, "coord_origin": "TOPLEFT"}, "text": "40", "orig": "40", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 115, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 312.93, "r_y0": 142.35799999999995, "r_x1": 320.56, "r_y1": 142.35799999999995, "r_x2": 320.56, "r_y2": 136.81600000000003, "r_x3": 312.93, "r_y3": 136.81600000000003, "coord_origin": "TOPLEFT"}, "text": "60", "orig": "60", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 116, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 312.482, "r_y0": 111.37199999999996, "r_x1": 320.112, "r_y1": 111.37199999999996, "r_x2": 320.112, "r_y2": 105.83000000000004, "r_x3": 312.482, "r_y3": 105.83000000000004, "coord_origin": "TOPLEFT"}, "text": "80", "orig": "80", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 117, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 312.482, "r_y0": 218.02999999999997, "r_x1": 320.112, "r_y1": 218.02999999999997, "r_x2": 320.112, "r_y2": 212.48699999999997, "r_x3": 312.482, "r_y3": 212.48699999999997, "coord_origin": "TOPLEFT"}, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 118, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 313.076, "r_y0": 189.49199999999996, "r_x1": 320.707, "r_y1": 189.49199999999996, "r_x2": 320.707, "r_y2": 183.95000000000005, "r_x3": 313.076, "r_y3": 183.95000000000005, "coord_origin": "TOPLEFT"}, "text": "30", "orig": "30", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 119, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 312.763, "r_y0": 158.24400000000003, "r_x1": 320.393, "r_y1": 158.24400000000003, "r_x2": 320.393, "r_y2": 152.702, "r_x3": 312.763, "r_y3": 152.702, "coord_origin": "TOPLEFT"}, "text": "50", "orig": "50", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 120, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 312.198, "r_y0": 126.34100000000001, "r_x1": 319.828, "r_y1": 126.34100000000001, "r_x2": 319.828, "r_y2": 120.798, "r_x3": 312.198, "r_y3": 120.798, "coord_origin": "TOPLEFT"}, "text": "70", "orig": "70", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 121, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 312.817, "r_y0": 95.87900000000002, "r_x1": 320.447, "r_y1": 95.87900000000002, "r_x2": 320.447, "r_y2": 90.33699999999999, "r_x3": 312.817, "r_y3": 90.33699999999999, "coord_origin": "TOPLEFT"}, "text": "90", "orig": "90", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 122, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 532.174, "r_y0": 229.94000000000005, "r_x1": 536.944, "r_y1": 229.94000000000005, "r_x2": 536.944, "r_y2": 223.01199999999994, "r_x3": 532.174, "r_y3": 223.01199999999994, "coord_origin": "TOPLEFT"}, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 123, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 532.88, "r_y0": 115.48000000000002, "r_x1": 547.613, "r_y1": 115.48000000000002, "r_x2": 547.613, "r_y2": 108.55200000000002, "r_x3": 532.88, "r_y3": 108.55200000000002, "coord_origin": "TOPLEFT"}, "text": "10K", "orig": "10K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 124, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 532.774, "r_y0": 137.99400000000003, "r_x1": 542.739, "r_y1": 137.99400000000003, "r_x2": 542.739, "r_y2": 131.06600000000003, "r_x3": 532.774, "r_y3": 131.06600000000003, "coord_origin": "TOPLEFT"}, "text": "8K", "orig": "8K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 125, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 532.799, "r_y0": 161.13599999999997, "r_x1": 542.764, "r_y1": 161.13599999999997, "r_x2": 542.764, "r_y2": 154.20799999999997, "r_x3": 532.799, "r_y3": 154.20799999999997, "coord_origin": "TOPLEFT"}, "text": "6K", "orig": "6K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 126, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 532.571, "r_y0": 183.971, "r_x1": 542.536, "r_y1": 183.971, "r_x2": 542.536, "r_y2": 177.043, "r_x3": 532.571, "r_y3": 177.043, "coord_origin": "TOPLEFT"}, "text": "4K", "orig": "4K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 127, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 532.146, "r_y0": 206.85900000000004, "r_x1": 542.111, "r_y1": 206.85900000000004, "r_x2": 542.111, "r_y2": 199.93100000000004, "r_x3": 532.146, "r_y3": 199.93100000000004, "coord_origin": "TOPLEFT"}, "text": "2K", "orig": "2K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": [{"id": 12, "label": "section_header", "bbox": {"l": 380.799, "t": 80.154, "r": 486.849, "b": 88.46699999999998, "coord_origin": "TOPLEFT"}, "confidence": 0.5687217116355896, "cells": [{"index": 104, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 380.799, "r_y0": 88.46699999999998, "r_x1": 486.849, "r_y1": 88.46699999999998, "r_x2": 486.849, "r_y2": 80.154, "r_x3": 380.799, "r_y3": 80.154, "coord_origin": "TOPLEFT"}, "text": "PubTabNet + FinTabNet", "orig": "PubTabNet + FinTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 16, "label": "text", "bbox": {"l": 396.768, "t": 242.36900000000003, "r": 469.787, "b": 250.68200000000002, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 105, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 396.768, "r_y0": 250.68200000000002, "r_x1": 469.787, "r_y1": 250.68200000000002, "r_x2": 469.787, "r_y2": 242.36900000000003, "r_x3": 396.768, "r_y3": 242.36900000000003, "coord_origin": "TOPLEFT"}, "text": "Rows / Columns", "orig": "Rows / Columns", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 17, "label": "text", "bbox": {"l": 320.977, "t": 233.65099999999995, "r": 324.793, "b": 239.19299999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 106, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.977, "r_y0": 239.19299999999998, "r_x1": 324.793, "r_y1": 239.19299999999998, "r_x2": 324.793, "r_y2": 233.65099999999995, "r_x3": 320.977, "r_y3": 233.65099999999995, "coord_origin": "TOPLEFT"}, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 18, "label": "text", "bbox": {"l": 410.483, "t": 233.65099999999995, "r": 418.113, "b": 239.19299999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 107, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 410.483, "r_y0": 239.19299999999998, "r_x1": 418.113, "r_y1": 239.19299999999998, "r_x2": 418.113, "r_y2": 233.65099999999995, "r_x3": 410.483, "r_y3": 233.65099999999995, "coord_origin": "TOPLEFT"}, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 19, "label": "text", "bbox": {"l": 500.85, "t": 233.65099999999995, "r": 508.48, "b": 239.19299999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 108, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 500.85, "r_y0": 239.19299999999998, "r_x1": 508.48, "r_y1": 239.19299999999998, "r_x2": 508.48, "r_y2": 233.65099999999995, "r_x3": 500.85, "r_y3": 233.65099999999995, "coord_origin": "TOPLEFT"}, "text": "40", "orig": "40", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 20, "label": "text", "bbox": {"l": 365.3, "t": 233.65099999999995, "r": 372.93, "b": 239.19299999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 109, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 365.3, "r_y0": 239.19299999999998, "r_x1": 372.93, "r_y1": 239.19299999999998, "r_x2": 372.93, "r_y2": 233.65099999999995, "r_x3": 365.3, "r_y3": 233.65099999999995, "coord_origin": "TOPLEFT"}, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 21, "label": "text", "bbox": {"l": 455.666, "t": 233.65099999999995, "r": 463.296, "b": 239.19299999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 110, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 455.666, "r_y0": 239.19299999999998, "r_x1": 463.296, "r_y1": 239.19299999999998, "r_x2": 463.296, "r_y2": 233.65099999999995, "r_x3": 455.666, "r_y3": 233.65099999999995, "coord_origin": "TOPLEFT"}, "text": "30", "orig": "30", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 22, "label": "text", "bbox": {"l": 542.035, "t": 233.65099999999995, "r": 549.665, "b": 239.19299999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 111, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 542.035, "r_y0": 239.19299999999998, "r_x1": 549.665, "r_y1": 239.19299999999998, "r_x2": 549.665, "r_y2": 233.65099999999995, "r_x3": 542.035, "r_y3": 233.65099999999995, "coord_origin": "TOPLEFT"}, "text": "50", "orig": "50", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 23, "label": "text", "bbox": {"l": 316.045, "t": 230.67399999999998, "r": 319.861, "b": 236.21699999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 112, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 316.045, "r_y0": 236.21699999999998, "r_x1": 319.861, "r_y1": 236.21699999999998, "r_x2": 319.861, "r_y2": 230.67399999999998, "r_x3": 316.045, "r_y3": 230.67399999999998, "coord_origin": "TOPLEFT"}, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 24, "label": "text", "bbox": {"l": 312.625, "t": 198.91899999999998, "r": 320.255, "b": 204.461, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 113, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 312.625, "r_y0": 204.461, "r_x1": 320.255, "r_y1": 204.461, "r_x2": 320.255, "r_y2": 198.91899999999998, "r_x3": 312.625, "r_y3": 198.91899999999998, "coord_origin": "TOPLEFT"}, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 25, "label": "text", "bbox": {"l": 313.15, "t": 168.32600000000002, "r": 320.78, "b": 173.86800000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 114, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 313.15, "r_y0": 173.86800000000005, "r_x1": 320.78, "r_y1": 173.86800000000005, "r_x2": 320.78, "r_y2": 168.32600000000002, "r_x3": 313.15, "r_y3": 168.32600000000002, "coord_origin": "TOPLEFT"}, "text": "40", "orig": "40", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 26, "label": "text", "bbox": {"l": 312.93, "t": 136.81600000000003, "r": 320.56, "b": 142.35799999999995, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 115, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 312.93, "r_y0": 142.35799999999995, "r_x1": 320.56, "r_y1": 142.35799999999995, "r_x2": 320.56, "r_y2": 136.81600000000003, "r_x3": 312.93, "r_y3": 136.81600000000003, "coord_origin": "TOPLEFT"}, "text": "60", "orig": "60", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 27, "label": "text", "bbox": {"l": 312.482, "t": 105.83000000000004, "r": 320.112, "b": 111.37199999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 116, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 312.482, "r_y0": 111.37199999999996, "r_x1": 320.112, "r_y1": 111.37199999999996, "r_x2": 320.112, "r_y2": 105.83000000000004, "r_x3": 312.482, "r_y3": 105.83000000000004, "coord_origin": "TOPLEFT"}, "text": "80", "orig": "80", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 28, "label": "text", "bbox": {"l": 312.482, "t": 212.48699999999997, "r": 320.112, "b": 218.02999999999997, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 117, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 312.482, "r_y0": 218.02999999999997, "r_x1": 320.112, "r_y1": 218.02999999999997, "r_x2": 320.112, "r_y2": 212.48699999999997, "r_x3": 312.482, "r_y3": 212.48699999999997, "coord_origin": "TOPLEFT"}, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 29, "label": "text", "bbox": {"l": 313.076, "t": 183.95000000000005, "r": 320.707, "b": 189.49199999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 118, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 313.076, "r_y0": 189.49199999999996, "r_x1": 320.707, "r_y1": 189.49199999999996, "r_x2": 320.707, "r_y2": 183.95000000000005, "r_x3": 313.076, "r_y3": 183.95000000000005, "coord_origin": "TOPLEFT"}, "text": "30", "orig": "30", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 30, "label": "text", "bbox": {"l": 312.763, "t": 152.702, "r": 320.393, "b": 158.24400000000003, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 119, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 312.763, "r_y0": 158.24400000000003, "r_x1": 320.393, "r_y1": 158.24400000000003, "r_x2": 320.393, "r_y2": 152.702, "r_x3": 312.763, "r_y3": 152.702, "coord_origin": "TOPLEFT"}, "text": "50", "orig": "50", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 31, "label": "text", "bbox": {"l": 312.198, "t": 120.798, "r": 319.828, "b": 126.34100000000001, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 120, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 312.198, "r_y0": 126.34100000000001, "r_x1": 319.828, "r_y1": 126.34100000000001, "r_x2": 319.828, "r_y2": 120.798, "r_x3": 312.198, "r_y3": 120.798, "coord_origin": "TOPLEFT"}, "text": "70", "orig": "70", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 32, "label": "text", "bbox": {"l": 312.817, "t": 90.33699999999999, "r": 320.447, "b": 95.87900000000002, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 121, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 312.817, "r_y0": 95.87900000000002, "r_x1": 320.447, "r_y1": 95.87900000000002, "r_x2": 320.447, "r_y2": 90.33699999999999, "r_x3": 312.817, "r_y3": 90.33699999999999, "coord_origin": "TOPLEFT"}, "text": "90", "orig": "90", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 33, "label": "text", "bbox": {"l": 532.174, "t": 223.01199999999994, "r": 536.944, "b": 229.94000000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 122, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 532.174, "r_y0": 229.94000000000005, "r_x1": 536.944, "r_y1": 229.94000000000005, "r_x2": 536.944, "r_y2": 223.01199999999994, "r_x3": 532.174, "r_y3": 223.01199999999994, "coord_origin": "TOPLEFT"}, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 34, "label": "text", "bbox": {"l": 532.88, "t": 108.55200000000002, "r": 547.613, "b": 115.48000000000002, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 123, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 532.88, "r_y0": 115.48000000000002, "r_x1": 547.613, "r_y1": 115.48000000000002, "r_x2": 547.613, "r_y2": 108.55200000000002, "r_x3": 532.88, "r_y3": 108.55200000000002, "coord_origin": "TOPLEFT"}, "text": "10K", "orig": "10K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 35, "label": "text", "bbox": {"l": 532.774, "t": 131.06600000000003, "r": 542.739, "b": 137.99400000000003, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 124, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 532.774, "r_y0": 137.99400000000003, "r_x1": 542.739, "r_y1": 137.99400000000003, "r_x2": 542.739, "r_y2": 131.06600000000003, "r_x3": 532.774, "r_y3": 131.06600000000003, "coord_origin": "TOPLEFT"}, "text": "8K", "orig": "8K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 36, "label": "text", "bbox": {"l": 532.799, "t": 154.20799999999997, "r": 542.764, "b": 161.13599999999997, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 125, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 532.799, "r_y0": 161.13599999999997, "r_x1": 542.764, "r_y1": 161.13599999999997, "r_x2": 542.764, "r_y2": 154.20799999999997, "r_x3": 532.799, "r_y3": 154.20799999999997, "coord_origin": "TOPLEFT"}, "text": "6K", "orig": "6K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 37, "label": "text", "bbox": {"l": 532.571, "t": 177.043, "r": 542.536, "b": 183.971, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 126, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 532.571, "r_y0": 183.971, "r_x1": 542.536, "r_y1": 183.971, "r_x2": 542.536, "r_y2": 177.043, "r_x3": 532.571, "r_y3": 177.043, "coord_origin": "TOPLEFT"}, "text": "4K", "orig": "4K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 38, "label": "text", "bbox": {"l": 532.146, "t": 199.93100000000004, "r": 542.111, "b": 206.85900000000004, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 127, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 532.146, "r_y0": 206.85900000000004, "r_x1": 542.111, "r_y1": 206.85900000000004, "r_x2": 542.111, "r_y2": 199.93100000000004, "r_x3": 532.146, "r_y3": 199.93100000000004, "coord_origin": "TOPLEFT"}, "text": "2K", "orig": "2K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}]}, {"id": 7, "label": "caption", "bbox": {"l": 308.862, "t": 268.105, "r": 545.115, "b": 288.612, "coord_origin": "TOPLEFT"}, "confidence": 0.9667505025863647, "cells": [{"index": 128, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 276.65700000000004, "r_x1": 346.062, "r_y1": 276.65700000000004, "r_x2": 346.062, "r_y2": 268.105, "r_x3": 308.862, "r_y3": 268.105, "coord_origin": "TOPLEFT"}, "text": "Figure 2:", "orig": "Figure 2:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 129, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 354.491, "r_y0": 276.65700000000004, "r_x1": 545.115, "r_y1": 276.65700000000004, "r_x2": 545.115, "r_y2": 268.105, "r_x3": 354.491, "r_y3": 268.105, "coord_origin": "TOPLEFT"}, "text": "Distribution of the tables across different table", "orig": "Distribution of the tables across different table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 130, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 288.612, "r_x1": 498.57, "r_y1": 288.612, "r_x2": 498.57, "r_y2": 280.06, "r_x3": 308.862, "r_y3": 280.06, "coord_origin": "TOPLEFT"}, "text": "dimensions in PubTabNet + FinTabNet datasets", "orig": "dimensions in PubTabNet + FinTabNet datasets", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 9, "label": "text", "bbox": {"l": 308.862, "t": 317.742, "r": 437.27, "b": 326.294, "coord_origin": "TOPLEFT"}, "confidence": 0.8879811763763428, "cells": [{"index": 131, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 326.294, "r_x1": 437.27, "r_y1": 326.294, "r_x2": 437.27, "r_y2": 317.742, "r_x3": 308.862, "r_y3": 317.742, "coord_origin": "TOPLEFT"}, "text": "balance in the previous datasets.", "orig": "balance in the previous datasets.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 2, "label": "text", "bbox": {"l": 308.862, "t": 331.8, "r": 545.115, "b": 627.2760000000001, "coord_origin": "TOPLEFT"}, "confidence": 0.9870319366455078, "cells": [{"index": 132, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 340.352, "r_x1": 545.115, "r_y1": 340.352, "r_x2": 545.115, "r_y2": 331.8, "r_x3": 320.817, "r_y3": 331.8, "coord_origin": "TOPLEFT"}, "text": "The PubTabNet dataset contains 509k tables delivered as", "orig": "The PubTabNet dataset contains 509k tables delivered as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 133, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 352.307, "r_x1": 545.115, "r_y1": 352.307, "r_x2": 545.115, "r_y2": 343.755, "r_x3": 308.862, "r_y3": 343.755, "coord_origin": "TOPLEFT"}, "text": "annotated PNGimages. The annotations consist of the table", "orig": "annotated PNGimages. The annotations consist of the table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 134, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 364.263, "r_x1": 545.115, "r_y1": 364.263, "r_x2": 545.115, "r_y2": 355.711, "r_x3": 308.862, "r_y3": 355.711, "coord_origin": "TOPLEFT"}, "text": "structure represented in HTML format, the tokenized text", "orig": "structure represented in HTML format, the tokenized text", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 135, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 376.218, "r_x1": 545.115, "r_y1": 376.218, "r_x2": 545.115, "r_y2": 367.666, "r_x3": 308.862, "r_y3": 367.666, "coord_origin": "TOPLEFT"}, "text": "and its bounding boxes per table cell. Fig. 1 shows the ap-", "orig": "and its bounding boxes per table cell. Fig. 1 shows the ap-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 136, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 388.173, "r_x1": 545.115, "r_y1": 388.173, "r_x2": 545.115, "r_y2": 379.621, "r_x3": 308.862, "r_y3": 379.621, "coord_origin": "TOPLEFT"}, "text": "pearance style of PubTabNet. Depending on its complexity,", "orig": "pearance style of PubTabNet. Depending on its complexity,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 137, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 400.128, "r_x1": 545.115, "r_y1": 400.128, "r_x2": 545.115, "r_y2": 391.576, "r_x3": 308.862, "r_y3": 391.576, "coord_origin": "TOPLEFT"}, "text": "a table is characterized as 'simple' when it does not contain", "orig": "a table is characterized as 'simple' when it does not contain", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 138, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 412.083, "r_x1": 545.115, "r_y1": 412.083, "r_x2": 545.115, "r_y2": 403.531, "r_x3": 308.862, "r_y3": 403.531, "coord_origin": "TOPLEFT"}, "text": "row spans or column spans, otherwise it is 'complex'. The", "orig": "row spans or column spans, otherwise it is 'complex'. The", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 139, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 424.038, "r_x1": 545.115, "r_y1": 424.038, "r_x2": 545.115, "r_y2": 415.486, "r_x3": 308.862, "r_y3": 415.486, "coord_origin": "TOPLEFT"}, "text": "dataset is divided into Train and Val splits (roughly 98%and", "orig": "dataset is divided into Train and Val splits (roughly 98%and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 140, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 435.994, "r_x1": 545.115, "r_y1": 435.994, "r_x2": 545.115, "r_y2": 427.442, "r_x3": 308.862, "r_y3": 427.442, "coord_origin": "TOPLEFT"}, "text": "2%). The Train split consists of 54% simple and 46% com-", "orig": "2%). The Train split consists of 54% simple and 46% com-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 141, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 447.949, "r_x1": 545.115, "r_y1": 447.949, "r_x2": 545.115, "r_y2": 439.397, "r_x3": 308.862, "r_y3": 439.397, "coord_origin": "TOPLEFT"}, "text": "plex tables and the Val split of 51% and 49% respectively.", "orig": "plex tables and the Val split of 51% and 49% respectively.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 142, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 459.904, "r_x1": 545.115, "r_y1": 459.904, "r_x2": 545.115, "r_y2": 451.352, "r_x3": 308.862, "r_y3": 451.352, "coord_origin": "TOPLEFT"}, "text": "The FinTabNet dataset contains 112k tables delivered as", "orig": "The FinTabNet dataset contains 112k tables delivered as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 143, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 471.859, "r_x1": 545.115, "r_y1": 471.859, "r_x2": 545.115, "r_y2": 463.307, "r_x3": 308.862, "r_y3": 463.307, "coord_origin": "TOPLEFT"}, "text": "single-page PDFdocuments with mixed table structures and", "orig": "single-page PDFdocuments with mixed table structures and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 144, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 483.814, "r_x1": 358.984, "r_y1": 483.814, "r_x2": 358.984, "r_y2": 475.262, "r_x3": 308.862, "r_y3": 475.262, "coord_origin": "TOPLEFT"}, "text": "text content.", "orig": "text content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 145, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 365.121, "r_y0": 483.814, "r_x1": 545.115, "r_y1": 483.814, "r_x2": 545.115, "r_y2": 475.262, "r_x3": 365.121, "r_y3": 475.262, "coord_origin": "TOPLEFT"}, "text": "Similarly to the PubTabNet, the annotations", "orig": "Similarly to the PubTabNet, the annotations", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 146, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 495.77, "r_x1": 545.115, "r_y1": 495.77, "r_x2": 545.115, "r_y2": 487.218, "r_x3": 308.862, "r_y3": 487.218, "coord_origin": "TOPLEFT"}, "text": "of FinTabNet include the table structure in HTML, the to-", "orig": "of FinTabNet include the table structure in HTML, the to-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 147, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 507.725, "r_x1": 545.115, "r_y1": 507.725, "r_x2": 545.115, "r_y2": 499.173, "r_x3": 308.862, "r_y3": 499.173, "coord_origin": "TOPLEFT"}, "text": "kenized text and the bounding boxes on a table cell basis.", "orig": "kenized text and the bounding boxes on a table cell basis.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 148, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 519.6800000000001, "r_x1": 545.115, "r_y1": 519.6800000000001, "r_x2": 545.115, "r_y2": 511.128, "r_x3": 308.862, "r_y3": 511.128, "coord_origin": "TOPLEFT"}, "text": "The dataset is divided into Train, Test and Val splits (81%,", "orig": "The dataset is divided into Train, Test and Val splits (81%,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 149, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 531.635, "r_x1": 545.115, "r_y1": 531.635, "r_x2": 545.115, "r_y2": 523.0830000000001, "r_x3": 308.862, "r_y3": 523.0830000000001, "coord_origin": "TOPLEFT"}, "text": "9.5%, 9.5%), and each one is almost equally divided into", "orig": "9.5%, 9.5%), and each one is almost equally divided into", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 150, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 543.59, "r_x1": 545.115, "r_y1": 543.59, "r_x2": 545.115, "r_y2": 535.038, "r_x3": 308.862, "r_y3": 535.038, "coord_origin": "TOPLEFT"}, "text": "simple and complex tables (Train: 48% simple, 52% com-", "orig": "simple and complex tables (Train: 48% simple, 52% com-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 151, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 555.545, "r_x1": 350.964, "r_y1": 555.545, "r_x2": 350.964, "r_y2": 546.9929999999999, "r_x3": 308.862, "r_y3": 546.9929999999999, "coord_origin": "TOPLEFT"}, "text": "plex, Test:", "orig": "plex, Test:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 152, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 355.467, "r_y0": 555.545, "r_x1": 490.082, "r_y1": 555.545, "r_x2": 490.082, "r_y2": 546.9929999999999, "r_x3": 355.467, "r_y3": 546.9929999999999, "coord_origin": "TOPLEFT"}, "text": "48% simple, 52% complex, Test:", "orig": "48% simple, 52% complex, Test:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 153, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 494.595, "r_y0": 555.545, "r_x1": 545.115, "r_y1": 555.545, "r_x2": 545.115, "r_y2": 546.9929999999999, "r_x3": 494.595, "r_y3": 546.9929999999999, "coord_origin": "TOPLEFT"}, "text": "53% simple,", "orig": "53% simple,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 154, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 567.501, "r_x1": 370.6, "r_y1": 567.501, "r_x2": 370.6, "r_y2": 558.9490000000001, "r_x3": 308.862, "r_y3": 558.9490000000001, "coord_origin": "TOPLEFT"}, "text": "47% complex).", "orig": "47% complex).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 155, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 376.737, "r_y0": 567.501, "r_x1": 545.115, "r_y1": 567.501, "r_x2": 545.115, "r_y2": 558.9490000000001, "r_x3": 376.737, "r_y3": 558.9490000000001, "coord_origin": "TOPLEFT"}, "text": "Finally the TableBank dataset consists of", "orig": "Finally the TableBank dataset consists of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 156, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 579.456, "r_x1": 545.115, "r_y1": 579.456, "r_x2": 545.115, "r_y2": 570.904, "r_x3": 308.862, "r_y3": 570.904, "coord_origin": "TOPLEFT"}, "text": "145k tables provided as JPEG images. The latter has anno-", "orig": "145k tables provided as JPEG images. The latter has anno-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 157, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 591.4110000000001, "r_x1": 545.115, "r_y1": 591.4110000000001, "r_x2": 545.115, "r_y2": 582.859, "r_x3": 308.862, "r_y3": 582.859, "coord_origin": "TOPLEFT"}, "text": "tations for the table structure, but only few with bounding", "orig": "tations for the table structure, but only few with bounding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 158, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 603.366, "r_x1": 403.726, "r_y1": 603.366, "r_x2": 403.726, "r_y2": 594.814, "r_x3": 308.862, "r_y3": 594.814, "coord_origin": "TOPLEFT"}, "text": "boxes of the table cells.", "orig": "boxes of the table cells.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 159, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 407.731, "r_y0": 603.366, "r_x1": 545.115, "r_y1": 603.366, "r_x2": 545.115, "r_y2": 594.814, "r_x3": 407.731, "r_y3": 594.814, "coord_origin": "TOPLEFT"}, "text": "The entire dataset consists of sim-", "orig": "The entire dataset consists of sim-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 160, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 615.321, "r_x1": 545.115, "r_y1": 615.321, "r_x2": 545.115, "r_y2": 606.769, "r_x3": 308.862, "r_y3": 606.769, "coord_origin": "TOPLEFT"}, "text": "ple tables and it is divided into 90% Train, 3% Test and 7%", "orig": "ple tables and it is divided into 90% Train, 3% Test and 7%", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 161, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 627.2760000000001, "r_x1": 348.164, "r_y1": 627.2760000000001, "r_x2": 348.164, "r_y2": 618.7239999999999, "r_x3": 308.862, "r_y3": 618.7239999999999, "coord_origin": "TOPLEFT"}, "text": "Val splits.", "orig": "Val splits.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 4, "label": "text", "bbox": {"l": 308.862, "t": 632.783, "r": 545.115, "b": 713.066, "coord_origin": "TOPLEFT"}, "confidence": 0.9840091466903687, "cells": [{"index": 162, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 641.335, "r_x1": 545.115, "r_y1": 641.335, "r_x2": 545.115, "r_y2": 632.783, "r_x3": 320.817, "r_y3": 632.783, "coord_origin": "TOPLEFT"}, "text": "Due to the heterogeneity across the dataset formats, it", "orig": "Due to the heterogeneity across the dataset formats, it", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 163, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 653.29, "r_x1": 545.115, "r_y1": 653.29, "r_x2": 545.115, "r_y2": 644.738, "r_x3": 308.862, "r_y3": 644.738, "coord_origin": "TOPLEFT"}, "text": "was necessary to combine all available data into one homog-", "orig": "was necessary to combine all available data into one homog-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 164, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 665.245, "r_x1": 545.115, "r_y1": 665.245, "r_x2": 545.115, "r_y2": 656.693, "r_x3": 308.862, "r_y3": 656.693, "coord_origin": "TOPLEFT"}, "text": "enized dataset before we could train our models for practi-", "orig": "enized dataset before we could train our models for practi-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 165, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 677.201, "r_x1": 361.245, "r_y1": 677.201, "r_x2": 361.245, "r_y2": 668.649, "r_x3": 308.862, "r_y3": 668.649, "coord_origin": "TOPLEFT"}, "text": "cal purposes.", "orig": "cal purposes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 166, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 365.44, "r_y0": 677.201, "r_x1": 545.115, "r_y1": 677.201, "r_x2": 545.115, "r_y2": 668.649, "r_x3": 365.44, "r_y3": 668.649, "coord_origin": "TOPLEFT"}, "text": "Given the size of PubTabNet, we adopted its", "orig": "Given the size of PubTabNet, we adopted its", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 167, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 689.156, "r_x1": 545.115, "r_y1": 689.156, "r_x2": 545.115, "r_y2": 680.604, "r_x3": 308.862, "r_y3": 680.604, "coord_origin": "TOPLEFT"}, "text": "annotation format and we extracted and converted all tables", "orig": "annotation format and we extracted and converted all tables", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 168, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 701.111, "r_x1": 487.322, "r_y1": 701.111, "r_x2": 487.322, "r_y2": 692.559, "r_x3": 308.862, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "as PNG images with a resolution of 72 dpi.", "orig": "as PNG images with a resolution of 72 dpi.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 169, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 492.901, "r_y0": 701.111, "r_x1": 545.115, "r_y1": 701.111, "r_x2": 545.115, "r_y2": 692.559, "r_x3": 492.901, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "Additionally,", "orig": "Additionally,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 170, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 713.066, "r_x1": 545.115, "r_y1": 713.066, "r_x2": 545.115, "r_y2": 704.514, "r_x3": 308.862, "r_y3": 704.514, "coord_origin": "TOPLEFT"}, "text": "we have filtered out tables with extreme sizes due to small", "orig": "we have filtered out tables with extreme sizes due to small", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 11, "label": "page_footer", "bbox": {"l": 295.121, "t": 734.402, "r": 300.102, "b": 742.954, "coord_origin": "TOPLEFT"}, "confidence": 0.8715606927871704, "cells": [{"index": 171, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 295.121, "r_y0": 742.954, "r_x1": 300.102, "r_y1": 742.954, "r_x2": 300.102, "r_y2": 734.402, "r_x3": 295.121, "r_y3": 734.402, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}]}, "tablestructure": {"table_map": {}}, "figures_classification": null, "equations_prediction": null, "vlm_response": null}, "assembled": {"elements": [{"label": "text", "id": 10, "page_no": 2, "cluster": {"id": 10, "label": "text", "bbox": {"l": 50.112, "t": 75.47699999999998, "r": 250.151, "b": 84.029, "coord_origin": "TOPLEFT"}, "confidence": 0.8767216801643372, "cells": [{"index": 0, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 84.029, "r_x1": 250.151, "r_y1": 84.029, "r_x2": 250.151, "r_y2": 75.47699999999998, "r_x3": 50.112, "r_y3": 75.47699999999998, "coord_origin": "TOPLEFT"}, "text": "tag-decoder which is constrained to the table-tags.", "orig": "tag-decoder which is constrained to the table-tags.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "tag-decoder which is constrained to the table-tags."}, {"label": "text", "id": 5, "page_no": 2, "cluster": {"id": 5, "label": "text", "bbox": {"l": 50.112, "t": 87.48800000000006, "r": 286.365, "b": 275.36800000000005, "coord_origin": "TOPLEFT"}, "confidence": 0.9822593927383423, "cells": [{"index": 1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 96.03999999999996, "r_x1": 70.366, "r_y1": 96.03999999999996, "r_x2": 70.366, "r_y2": 87.48800000000006, "r_x3": 62.067, "r_y3": 87.48800000000006, "coord_origin": "TOPLEFT"}, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 76.931, "r_y0": 96.03999999999996, "r_x1": 110.953, "r_y1": 96.03999999999996, "r_x2": 110.953, "r_y2": 87.48800000000006, "r_x3": 76.931, "r_y3": 87.48800000000006, "coord_origin": "TOPLEFT"}, "text": "practice,", "orig": "practice,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 118.545, "r_y0": 96.03999999999996, "r_x1": 136.258, "r_y1": 96.03999999999996, "r_x2": 136.258, "r_y2": 87.48800000000006, "r_x3": 118.545, "r_y3": 87.48800000000006, "coord_origin": "TOPLEFT"}, "text": "both", "orig": "both", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 142.824, "r_y0": 96.03999999999996, "r_x1": 175.372, "r_y1": 96.03999999999996, "r_x2": 175.372, "r_y2": 87.48800000000006, "r_x3": 142.824, "r_y3": 87.48800000000006, "coord_origin": "TOPLEFT"}, "text": "network", "orig": "network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 181.947, "r_y0": 96.03999999999996, "r_x1": 232.836, "r_y1": 96.03999999999996, "r_x2": 232.836, "r_y2": 87.48800000000006, "r_x3": 181.947, "r_y3": 87.48800000000006, "coord_origin": "TOPLEFT"}, "text": "architectures", "orig": "architectures", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 239.411, "r_y0": 96.03999999999996, "r_x1": 265.414, "r_y1": 96.03999999999996, "r_x2": 265.414, "r_y2": 87.48800000000006, "r_x3": 239.411, "r_y3": 87.48800000000006, "coord_origin": "TOPLEFT"}, "text": "(IETD", "orig": "(IETD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 271.979, "r_y0": 96.03999999999996, "r_x1": 286.365, "r_y1": 96.03999999999996, "r_x2": 286.365, "r_y2": 87.48800000000006, "r_x3": 271.979, "r_y3": 87.48800000000006, "coord_origin": "TOPLEFT"}, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 107.995, "r_x1": 286.365, "r_y1": 107.995, "r_x2": 286.365, "r_y2": 99.44299999999998, "r_x3": 50.112, "r_y3": 99.44299999999998, "coord_origin": "TOPLEFT"}, "text": "IEDD) require an implicit, custom trained object-character-", "orig": "IEDD) require an implicit, custom trained object-character-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 119.95100000000002, "r_x1": 286.365, "r_y1": 119.95100000000002, "r_x2": 286.365, "r_y2": 111.399, "r_x3": 50.112, "r_y3": 111.399, "coord_origin": "TOPLEFT"}, "text": "recognition (OCR) to obtain the content of the table-cells.", "orig": "recognition (OCR) to obtain the content of the table-cells.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 131.90599999999995, "r_x1": 286.365, "r_y1": 131.90599999999995, "r_x2": 286.365, "r_y2": 123.35400000000004, "r_x3": 50.112, "r_y3": 123.35400000000004, "coord_origin": "TOPLEFT"}, "text": "In the case of IETD, this OCR engine is implicit in the de-", "orig": "In the case of IETD, this OCR engine is implicit in the de-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 143.861, "r_x1": 286.365, "r_y1": 143.861, "r_x2": 286.365, "r_y2": 135.30899999999997, "r_x3": 50.112, "r_y3": 135.30899999999997, "coord_origin": "TOPLEFT"}, "text": "coder similar to [24]. For the IEDD, the OCR is solely em-", "orig": "coder similar to [24]. For the IEDD, the OCR is solely em-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 155.81600000000003, "r_x1": 174.206, "r_y1": 155.81600000000003, "r_x2": 174.206, "r_y2": 147.264, "r_x3": 50.112, "r_y3": 147.264, "coord_origin": "TOPLEFT"}, "text": "bedded in the content-decoder.", "orig": "bedded in the content-decoder.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 179.098, "r_y0": 155.81600000000003, "r_x1": 286.365, "r_y1": 155.81600000000003, "r_x2": 286.365, "r_y2": 147.264, "r_x3": 179.098, "r_y3": 147.264, "coord_origin": "TOPLEFT"}, "text": "This reliance on a custom,", "orig": "This reliance on a custom,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 167.77099999999996, "r_x1": 243.267, "r_y1": 167.77099999999996, "r_x2": 243.267, "r_y2": 159.21900000000005, "r_x3": 50.112, "r_y3": 159.21900000000005, "coord_origin": "TOPLEFT"}, "text": "implicit OCR decoder is of course problematic.", "orig": "implicit OCR decoder is of course problematic.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 248.437, "r_y0": 167.77099999999996, "r_x1": 286.365, "r_y1": 167.77099999999996, "r_x2": 286.365, "r_y2": 159.21900000000005, "r_x3": 248.437, "r_y3": 159.21900000000005, "coord_origin": "TOPLEFT"}, "text": "OCR is a", "orig": "OCR is a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 179.726, "r_x1": 286.365, "r_y1": 179.726, "r_x2": 286.365, "r_y2": 171.17399999999998, "r_x3": 50.112, "r_y3": 171.17399999999998, "coord_origin": "TOPLEFT"}, "text": "well known and extremely tough problem, that often needs", "orig": "well known and extremely tough problem, that often needs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 191.68200000000002, "r_x1": 286.365, "r_y1": 191.68200000000002, "r_x2": 286.365, "r_y2": 183.13, "r_x3": 50.112, "r_y3": 183.13, "coord_origin": "TOPLEFT"}, "text": "custom training for each individual language. However, the", "orig": "custom training for each individual language. However, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 203.63699999999994, "r_x1": 126.655, "r_y1": 203.63699999999994, "r_x2": 126.655, "r_y2": 195.08500000000004, "r_x3": 50.112, "r_y3": 195.08500000000004, "coord_origin": "TOPLEFT"}, "text": "limited availability", "orig": "limited availability", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 19, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 130.59, "r_y0": 203.63699999999994, "r_x1": 142.206, "r_y1": 203.63699999999994, "r_x2": 142.206, "r_y2": 195.08500000000004, "r_x3": 130.59, "r_y3": 195.08500000000004, "coord_origin": "TOPLEFT"}, "text": "for", "orig": "for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 20, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 146.132, "r_y0": 203.63699999999994, "r_x1": 286.365, "r_y1": 203.63699999999994, "r_x2": 286.365, "r_y2": 195.08500000000004, "r_x3": 146.132, "r_y3": 195.08500000000004, "coord_origin": "TOPLEFT"}, "text": "non-english content in the current", "orig": "non-english content in the current", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 21, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 215.59199999999998, "r_x1": 286.365, "r_y1": 215.59199999999998, "r_x2": 286.365, "r_y2": 207.03999999999996, "r_x3": 50.112, "r_y3": 207.03999999999996, "coord_origin": "TOPLEFT"}, "text": "datasets, makes it impractical to apply the IETD and IEDD", "orig": "datasets, makes it impractical to apply the IETD and IEDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 22, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 227.54700000000003, "r_x1": 286.365, "r_y1": 227.54700000000003, "r_x2": 286.365, "r_y2": 218.995, "r_x3": 50.112, "r_y3": 218.995, "coord_origin": "TOPLEFT"}, "text": "methods on tables with other languages. Additionally, OCR", "orig": "methods on tables with other languages. Additionally, OCR", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 23, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 239.50199999999995, "r_x1": 286.365, "r_y1": 239.50199999999995, "r_x2": 286.365, "r_y2": 230.95000000000005, "r_x3": 50.112, "r_y3": 230.95000000000005, "coord_origin": "TOPLEFT"}, "text": "can be completely omitted if the tables originate from pro-", "orig": "can be completely omitted if the tables originate from pro-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 24, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 251.457, "r_x1": 286.365, "r_y1": 251.457, "r_x2": 286.365, "r_y2": 242.90499999999997, "r_x3": 50.112, "r_y3": 242.90499999999997, "coord_origin": "TOPLEFT"}, "text": "grammatic PDF documents with known positions of each", "orig": "grammatic PDF documents with known positions of each", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 25, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 263.413, "r_x1": 66.989, "r_y1": 263.413, "r_x2": 66.989, "r_y2": 254.861, "r_x3": 50.112, "r_y3": 254.861, "coord_origin": "TOPLEFT"}, "text": "cell.", "orig": "cell.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 26, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 71.382, "r_y0": 263.413, "r_x1": 286.365, "r_y1": 263.413, "r_x2": 286.365, "r_y2": 254.861, "r_x3": 71.382, "r_y3": 254.861, "coord_origin": "TOPLEFT"}, "text": "The latter was the inspiration for the work of this pa-", "orig": "The latter was the inspiration for the work of this pa-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 27, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 275.36800000000005, "r_x1": 64.777, "r_y1": 275.36800000000005, "r_x2": 64.777, "r_y2": 266.81600000000003, "r_x3": 50.112, "r_y3": 266.81600000000003, "coord_origin": "TOPLEFT"}, "text": "per.", "orig": "per.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "In practice, both network architectures (IETD and IEDD) require an implicit, custom trained object-characterrecognition (OCR) to obtain the content of the table-cells. In the case of IETD, this OCR engine is implicit in the decoder similar to [24]. For the IEDD, the OCR is solely embedded in the content-decoder. This reliance on a custom, implicit OCR decoder is of course problematic. OCR is a well known and extremely tough problem, that often needs custom training for each individual language. However, the limited availability for non-english content in the current datasets, makes it impractical to apply the IETD and IEDD methods on tables with other languages. Additionally, OCR can be completely omitted if the tables originate from programmatic PDF documents with known positions of each cell. The latter was the inspiration for the work of this paper."}, {"label": "text", "id": 0, "page_no": 2, "cluster": {"id": 0, "label": "text", "bbox": {"l": 50.112, "t": 278.43899999999996, "r": 286.365, "b": 490.617, "coord_origin": "TOPLEFT"}, "confidence": 0.9878450036048889, "cells": [{"index": 28, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 287.395, "r_x1": 90.301, "r_y1": 287.395, "r_x2": 90.301, "r_y2": 278.43899999999996, "r_x3": 62.067, "r_y3": 278.43899999999996, "coord_origin": "TOPLEFT"}, "text": "Graph", "orig": "Graph", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 29, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 96.677, "r_y0": 287.395, "r_x1": 126.007, "r_y1": 287.395, "r_x2": 126.007, "r_y2": 278.43899999999996, "r_x3": 96.677, "r_y3": 278.43899999999996, "coord_origin": "TOPLEFT"}, "text": "Neural", "orig": "Neural", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 30, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 132.373, "r_y0": 287.395, "r_x1": 171.566, "r_y1": 287.395, "r_x2": 171.566, "r_y2": 278.43899999999996, "r_x3": 132.373, "r_y3": 278.43899999999996, "coord_origin": "TOPLEFT"}, "text": "networks", "orig": "networks", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 171.568, "r_y0": 287.379, "r_x1": 174.338, "r_y1": 287.379, "r_x2": 174.338, "r_y2": 278.827, "r_x3": 171.568, "r_y3": 278.827, "coord_origin": "TOPLEFT"}, "text": ":", "orig": ":", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 185.187, "r_y0": 287.379, "r_x1": 210.083, "r_y1": 287.379, "r_x2": 210.083, "r_y2": 278.827, "r_x3": 185.187, "r_y3": 278.827, "coord_origin": "TOPLEFT"}, "text": "Graph", "orig": "Graph", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 216.459, "r_y0": 287.379, "r_x1": 243.568, "r_y1": 287.379, "r_x2": 243.568, "r_y2": 278.827, "r_x3": 216.459, "r_y3": 278.827, "coord_origin": "TOPLEFT"}, "text": "Neural", "orig": "Neural", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 249.944, "r_y0": 287.379, "r_x1": 286.357, "r_y1": 287.379, "r_x2": 286.357, "r_y2": 278.827, "r_x3": 249.944, "r_y3": 278.827, "coord_origin": "TOPLEFT"}, "text": "networks", "orig": "networks", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 299.335, "r_x1": 84.971, "r_y1": 299.335, "r_x2": 84.971, "r_y2": 290.783, "r_x3": 50.112, "r_y3": 290.783, "coord_origin": "TOPLEFT"}, "text": "(GNN's)", "orig": "(GNN's)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 91.347, "r_y0": 299.335, "r_x1": 107.845, "r_y1": 299.335, "r_x2": 107.845, "r_y2": 290.783, "r_x3": 91.347, "r_y3": 290.783, "coord_origin": "TOPLEFT"}, "text": "take", "orig": "take", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 114.211, "r_y0": 299.335, "r_x1": 118.635, "r_y1": 299.335, "r_x2": 118.635, "r_y2": 290.783, "r_x3": 114.211, "r_y3": 290.783, "coord_origin": "TOPLEFT"}, "text": "a", "orig": "a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 125.011, "r_y0": 299.335, "r_x1": 159.87, "r_y1": 299.335, "r_x2": 159.87, "r_y2": 290.783, "r_x3": 125.011, "r_y3": 290.783, "coord_origin": "TOPLEFT"}, "text": "radically", "orig": "radically", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 166.246, "r_y0": 299.335, "r_x1": 200.298, "r_y1": 299.335, "r_x2": 200.298, "r_y2": 290.783, "r_x3": 166.246, "r_y3": 290.783, "coord_origin": "TOPLEFT"}, "text": "different", "orig": "different", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 206.664, "r_y0": 299.335, "r_x1": 243.177, "r_y1": 299.335, "r_x2": 243.177, "r_y2": 290.783, "r_x3": 206.664, "r_y3": 290.783, "coord_origin": "TOPLEFT"}, "text": "approach", "orig": "approach", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 249.553, "r_y0": 299.335, "r_x1": 257.304, "r_y1": 299.335, "r_x2": 257.304, "r_y2": 290.783, "r_x3": 249.553, "r_y3": 290.783, "coord_origin": "TOPLEFT"}, "text": "to", "orig": "to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 263.68, "r_y0": 299.335, "r_x1": 286.365, "r_y1": 299.335, "r_x2": 286.365, "r_y2": 290.783, "r_x3": 263.68, "r_y3": 290.783, "coord_origin": "TOPLEFT"}, "text": "table-", "orig": "table-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 311.29, "r_x1": 84.971, "r_y1": 311.29, "r_x2": 84.971, "r_y2": 302.738, "r_x3": 50.112, "r_y3": 302.738, "coord_origin": "TOPLEFT"}, "text": "structure", "orig": "structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 88.986, "r_y0": 311.29, "r_x1": 131.168, "r_y1": 311.29, "r_x2": 131.168, "r_y2": 302.738, "r_x3": 88.986, "r_y3": 302.738, "coord_origin": "TOPLEFT"}, "text": "extraction.", "orig": "extraction.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 138.849, "r_y0": 311.29, "r_x1": 286.365, "r_y1": 311.29, "r_x2": 286.365, "r_y2": 302.738, "r_x3": 138.849, "r_y3": 302.738, "coord_origin": "TOPLEFT"}, "text": "Note that one table cell can consti-", "orig": "Note that one table cell can consti-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 323.245, "r_x1": 286.365, "r_y1": 323.245, "r_x2": 286.365, "r_y2": 314.693, "r_x3": 50.112, "r_y3": 314.693, "coord_origin": "TOPLEFT"}, "text": "tute out of multiple text-cells. To obtain the table-structure,", "orig": "tute out of multiple text-cells. To obtain the table-structure,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 335.2, "r_x1": 136.996, "r_y1": 335.2, "r_x2": 136.996, "r_y2": 326.648, "r_x3": 50.112, "r_y3": 326.648, "coord_origin": "TOPLEFT"}, "text": "one creates an initial", "orig": "one creates an initial", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 48, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 141.051, "r_y0": 335.2, "r_x1": 166.226, "r_y1": 335.2, "r_x2": 166.226, "r_y2": 326.648, "r_x3": 141.051, "r_y3": 326.648, "coord_origin": "TOPLEFT"}, "text": "graph,", "orig": "graph,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 49, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 170.679, "r_y0": 335.2, "r_x1": 286.365, "r_y1": 335.2, "r_x2": 286.365, "r_y2": 326.648, "r_x3": 170.679, "r_y3": 326.648, "coord_origin": "TOPLEFT"}, "text": "where each of the text-cells", "orig": "where each of the text-cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 50, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 347.155, "r_x1": 260.442, "r_y1": 347.155, "r_x2": 260.442, "r_y2": 338.603, "r_x3": 50.112, "r_y3": 338.603, "coord_origin": "TOPLEFT"}, "text": "becomes a node in the graph similar to [33, 34, 2].", "orig": "becomes a node in the graph similar to [33, 34, 2].", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 51, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 266.45, "r_y0": 347.155, "r_x1": 286.365, "r_y1": 347.155, "r_x2": 286.365, "r_y2": 338.603, "r_x3": 266.45, "r_y3": 338.603, "coord_origin": "TOPLEFT"}, "text": "Each", "orig": "Each", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 52, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 359.11, "r_x1": 286.365, "r_y1": 359.11, "r_x2": 286.365, "r_y2": 350.558, "r_x3": 50.112, "r_y3": 350.558, "coord_origin": "TOPLEFT"}, "text": "node is then associated with en embedding vector coming", "orig": "node is then associated with en embedding vector coming", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 53, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 371.066, "r_x1": 286.365, "r_y1": 371.066, "r_x2": 286.365, "r_y2": 362.514, "r_x3": 50.112, "r_y3": 362.514, "coord_origin": "TOPLEFT"}, "text": "from the encoded image, its coordinates and the encoded", "orig": "from the encoded image, its coordinates and the encoded", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 54, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 383.021, "r_x1": 67.397, "r_y1": 383.021, "r_x2": 67.397, "r_y2": 374.469, "r_x3": 50.112, "r_y3": 374.469, "coord_origin": "TOPLEFT"}, "text": "text.", "orig": "text.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 55, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 72.976, "r_y0": 383.021, "r_x1": 286.365, "r_y1": 383.021, "r_x2": 286.365, "r_y2": 374.469, "r_x3": 72.976, "r_y3": 374.469, "coord_origin": "TOPLEFT"}, "text": "Furthermore, nodes that represent adjacent text-cells", "orig": "Furthermore, nodes that represent adjacent text-cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 56, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 394.976, "r_x1": 92.602, "r_y1": 394.976, "r_x2": 92.602, "r_y2": 386.424, "r_x3": 50.112, "r_y3": 386.424, "coord_origin": "TOPLEFT"}, "text": "are linked.", "orig": "are linked.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 57, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 97.305, "r_y0": 394.976, "r_x1": 286.365, "r_y1": 394.976, "r_x2": 286.365, "r_y2": 386.424, "r_x3": 97.305, "r_y3": 386.424, "coord_origin": "TOPLEFT"}, "text": "Graph Convolutional Networks (GCN's) based", "orig": "Graph Convolutional Networks (GCN's) based", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 58, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 406.931, "r_x1": 286.365, "r_y1": 406.931, "r_x2": 286.365, "r_y2": 398.379, "r_x3": 50.112, "r_y3": 398.379, "coord_origin": "TOPLEFT"}, "text": "methods take the image as an input, but also the position of", "orig": "methods take the image as an input, but also the position of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 59, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 418.886, "r_x1": 286.365, "r_y1": 418.886, "r_x2": 286.365, "r_y2": 410.334, "r_x3": 50.112, "r_y3": 410.334, "coord_origin": "TOPLEFT"}, "text": "the text-cells and their content [18]. The purpose of a GCN", "orig": "the text-cells and their content [18]. The purpose of a GCN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 60, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 430.841, "r_x1": 286.365, "r_y1": 430.841, "r_x2": 286.365, "r_y2": 422.289, "r_x3": 50.112, "r_y3": 422.289, "coord_origin": "TOPLEFT"}, "text": "is to transform the input graph into a new graph, which re-", "orig": "is to transform the input graph into a new graph, which re-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 61, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 442.797, "r_x1": 198.236, "r_y1": 442.797, "r_x2": 198.236, "r_y2": 434.245, "r_x3": 50.112, "r_y3": 434.245, "coord_origin": "TOPLEFT"}, "text": "places the old links with new ones.", "orig": "places the old links with new ones.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 62, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 205.927, "r_y0": 442.797, "r_x1": 286.365, "r_y1": 442.797, "r_x2": 286.365, "r_y2": 434.245, "r_x3": 205.927, "r_y3": 434.245, "coord_origin": "TOPLEFT"}, "text": "The new links then", "orig": "The new links then", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 63, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 454.752, "r_x1": 165.618, "r_y1": 454.752, "r_x2": 165.618, "r_y2": 446.2, "r_x3": 50.112, "r_y3": 446.2, "coord_origin": "TOPLEFT"}, "text": "represent the table-structure.", "orig": "represent the table-structure.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 64, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 171.417, "r_y0": 454.752, "r_x1": 286.365, "r_y1": 454.752, "r_x2": 286.365, "r_y2": 446.2, "r_x3": 171.417, "r_y3": 446.2, "coord_origin": "TOPLEFT"}, "text": "With this approach, one can", "orig": "With this approach, one can", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 65, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 466.707, "r_x1": 242.36, "r_y1": 466.707, "r_x2": 242.36, "r_y2": 458.155, "r_x3": 50.112, "r_y3": 458.155, "coord_origin": "TOPLEFT"}, "text": "avoid the need to build custom OCR decoders.", "orig": "avoid the need to build custom OCR decoders.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 66, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 248.408, "r_y0": 466.707, "r_x1": 286.365, "r_y1": 466.707, "r_x2": 286.365, "r_y2": 458.155, "r_x3": 248.408, "r_y3": 458.155, "coord_origin": "TOPLEFT"}, "text": "However,", "orig": "However,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 67, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 478.662, "r_x1": 286.365, "r_y1": 478.662, "r_x2": 286.365, "r_y2": 470.11, "r_x3": 50.112, "r_y3": 470.11, "coord_origin": "TOPLEFT"}, "text": "the quality of the reconstructed structure is not comparable", "orig": "the quality of the reconstructed structure is not comparable", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 68, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 490.617, "r_x1": 186.5, "r_y1": 490.617, "r_x2": 186.5, "r_y2": 482.065, "r_x3": 50.112, "r_y3": 482.065, "coord_origin": "TOPLEFT"}, "text": "to the current state-of-the-art [18].", "orig": "to the current state-of-the-art [18].", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Graph Neural networks : Graph Neural networks (GNN's) take a radically different approach to tablestructure extraction. Note that one table cell can constitute out of multiple text-cells. To obtain the table-structure, one creates an initial graph, where each of the text-cells becomes a node in the graph similar to [33, 34, 2]. Each node is then associated with en embedding vector coming from the encoded image, its coordinates and the encoded text. Furthermore, nodes that represent adjacent text-cells are linked. Graph Convolutional Networks (GCN's) based methods take the image as an input, but also the position of the text-cells and their content [18]. The purpose of a GCN is to transform the input graph into a new graph, which replaces the old links with new ones. The new links then represent the table-structure. With this approach, one can avoid the need to build custom OCR decoders. However, the quality of the reconstructed structure is not comparable to the current state-of-the-art [18]."}, {"label": "text", "id": 1, "page_no": 2, "cluster": {"id": 1, "label": "text", "bbox": {"l": 50.112, "t": 493.689, "r": 286.366, "b": 622.181, "coord_origin": "TOPLEFT"}, "confidence": 0.9875094294548035, "cells": [{"index": 69, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 502.645, "r_x1": 252.881, "r_y1": 502.645, "r_x2": 252.881, "r_y2": 493.689, "r_x3": 62.067, "r_y3": 493.689, "coord_origin": "TOPLEFT"}, "text": "Hybrid Deep Learning-Rule-Based approach", "orig": "Hybrid Deep Learning-Rule-Based approach", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 70, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 252.882, "r_y0": 502.629, "r_x1": 255.652, "r_y1": 502.629, "r_x2": 255.652, "r_y2": 494.077, "r_x3": 252.882, "r_y3": 494.077, "coord_origin": "TOPLEFT"}, "text": ":", "orig": ":", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 71, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 258.63, "r_y0": 502.629, "r_x1": 286.366, "r_y1": 502.629, "r_x2": 286.366, "r_y2": 494.077, "r_x3": 258.63, "r_y3": 494.077, "coord_origin": "TOPLEFT"}, "text": "Apop-", "orig": "Apop-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 72, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 514.5840000000001, "r_x1": 286.365, "r_y1": 514.5840000000001, "r_x2": 286.365, "r_y2": 506.032, "r_x3": 50.112, "r_y3": 506.032, "coord_origin": "TOPLEFT"}, "text": "ular current model for table-structure identification is the", "orig": "ular current model for table-structure identification is the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 73, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 526.539, "r_x1": 286.365, "r_y1": 526.539, "r_x2": 286.365, "r_y2": 517.9870000000001, "r_x3": 50.112, "r_y3": 517.9870000000001, "coord_origin": "TOPLEFT"}, "text": "use of a hybrid Deep Learning-Rule-Based approach similar", "orig": "use of a hybrid Deep Learning-Rule-Based approach similar", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 74, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 538.494, "r_x1": 286.365, "r_y1": 538.494, "r_x2": 286.365, "r_y2": 529.942, "r_x3": 50.112, "r_y3": 529.942, "coord_origin": "TOPLEFT"}, "text": "to [27, 29]. In this approach, one first detects the position of", "orig": "to [27, 29]. In this approach, one first detects the position of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 75, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 550.45, "r_x1": 286.365, "r_y1": 550.45, "r_x2": 286.365, "r_y2": 541.898, "r_x3": 50.112, "r_y3": 541.898, "coord_origin": "TOPLEFT"}, "text": "the table-cells with object detection (e.g. YoloVx or Mask-", "orig": "the table-cells with object detection (e.g. YoloVx or Mask-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 76, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 562.405, "r_x1": 286.365, "r_y1": 562.405, "r_x2": 286.365, "r_y2": 553.8530000000001, "r_x3": 50.112, "r_y3": 553.8530000000001, "coord_origin": "TOPLEFT"}, "text": "RCNN), then classifies the table into different types (from", "orig": "RCNN), then classifies the table into different types (from", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 77, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 574.36, "r_x1": 59.527, "r_y1": 574.36, "r_x2": 59.527, "r_y2": 565.808, "r_x3": 50.112, "r_y3": 565.808, "coord_origin": "TOPLEFT"}, "text": "its", "orig": "its", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 78, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 64.259, "r_y0": 574.36, "r_x1": 95.8, "r_y1": 574.36, "r_x2": 95.8, "r_y2": 565.808, "r_x3": 64.259, "r_y3": 565.808, "coord_origin": "TOPLEFT"}, "text": "images)", "orig": "images)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 79, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 100.523, "r_y0": 574.36, "r_x1": 145.105, "r_y1": 574.36, "r_x2": 145.105, "r_y2": 565.808, "r_x3": 100.523, "r_y3": 565.808, "coord_origin": "TOPLEFT"}, "text": "and finally", "orig": "and finally", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 80, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 149.828, "r_y0": 574.36, "r_x1": 166.983, "r_y1": 574.36, "r_x2": 166.983, "r_y2": 565.808, "r_x3": 149.828, "r_y3": 565.808, "coord_origin": "TOPLEFT"}, "text": "uses", "orig": "uses", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 81, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 171.715, "r_y0": 574.36, "r_x1": 205.768, "r_y1": 574.36, "r_x2": 205.768, "r_y2": 565.808, "r_x3": 171.715, "r_y3": 565.808, "coord_origin": "TOPLEFT"}, "text": "different", "orig": "different", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 82, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 210.5, "r_y0": 574.36, "r_x1": 244.243, "r_y1": 574.36, "r_x2": 244.243, "r_y2": 565.808, "r_x3": 210.5, "r_y3": 565.808, "coord_origin": "TOPLEFT"}, "text": "rule-sets", "orig": "rule-sets", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 83, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 248.975, "r_y0": 574.36, "r_x1": 256.726, "r_y1": 574.36, "r_x2": 256.726, "r_y2": 565.808, "r_x3": 248.975, "r_y3": 565.808, "coord_origin": "TOPLEFT"}, "text": "to", "orig": "to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 84, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 261.459, "r_y0": 574.36, "r_x1": 286.365, "r_y1": 574.36, "r_x2": 286.365, "r_y2": 565.808, "r_x3": 261.459, "r_y3": 565.808, "coord_origin": "TOPLEFT"}, "text": "obtain", "orig": "obtain", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 85, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 586.315, "r_x1": 122.64, "r_y1": 586.315, "r_x2": 122.64, "r_y2": 577.763, "r_x3": 50.112, "r_y3": 577.763, "coord_origin": "TOPLEFT"}, "text": "its table-structure.", "orig": "its table-structure.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 86, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 127.482, "r_y0": 586.315, "r_x1": 286.365, "r_y1": 586.315, "r_x2": 286.365, "r_y2": 577.763, "r_x3": 127.482, "r_y3": 577.763, "coord_origin": "TOPLEFT"}, "text": "Currently, this approach achieves state-", "orig": "Currently, this approach achieves state-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 87, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 598.27, "r_x1": 87.731, "r_y1": 598.27, "r_x2": 87.731, "r_y2": 589.718, "r_x3": 50.112, "r_y3": 589.718, "coord_origin": "TOPLEFT"}, "text": "of-the-art", "orig": "of-the-art", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 88, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 92.074, "r_y0": 598.27, "r_x1": 120.577, "r_y1": 598.27, "r_x2": 120.577, "r_y2": 589.718, "r_x3": 92.074, "r_y3": 589.718, "coord_origin": "TOPLEFT"}, "text": "results,", "orig": "results,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 89, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 125.389, "r_y0": 598.27, "r_x1": 137.922, "r_y1": 598.27, "r_x2": 137.922, "r_y2": 589.718, "r_x3": 125.389, "r_y3": 589.718, "coord_origin": "TOPLEFT"}, "text": "but", "orig": "but", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 90, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 142.266, "r_y0": 598.27, "r_x1": 148.911, "r_y1": 598.27, "r_x2": 148.911, "r_y2": 589.718, "r_x3": 142.266, "r_y3": 589.718, "coord_origin": "TOPLEFT"}, "text": "is", "orig": "is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 91, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 153.255, "r_y0": 598.27, "r_x1": 165.987, "r_y1": 598.27, "r_x2": 165.987, "r_y2": 589.718, "r_x3": 153.255, "r_y3": 589.718, "coord_origin": "TOPLEFT"}, "text": "not", "orig": "not", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 92, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 170.331, "r_y0": 598.27, "r_x1": 286.365, "r_y1": 598.27, "r_x2": 286.365, "r_y2": 589.718, "r_x3": 170.331, "r_y3": 589.718, "coord_origin": "TOPLEFT"}, "text": "an end-to-end deep-learning", "orig": "an end-to-end deep-learning", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 93, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 610.225, "r_x1": 82.49, "r_y1": 610.225, "r_x2": 82.49, "r_y2": 601.673, "r_x3": 50.112, "r_y3": 601.673, "coord_origin": "TOPLEFT"}, "text": "method.", "orig": "method.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 94, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 87.173, "r_y0": 610.225, "r_x1": 286.365, "r_y1": 610.225, "r_x2": 286.365, "r_y2": 601.673, "r_x3": 87.173, "r_y3": 601.673, "coord_origin": "TOPLEFT"}, "text": "As such, new rules need to be written if different", "orig": "As such, new rules need to be written if different", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 95, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 622.181, "r_x1": 175.989, "r_y1": 622.181, "r_x2": 175.989, "r_y2": 613.629, "r_x3": 50.112, "r_y3": 613.629, "coord_origin": "TOPLEFT"}, "text": "types of tables are encountered.", "orig": "types of tables are encountered.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Hybrid Deep Learning-Rule-Based approach : Apopular current model for table-structure identification is the use of a hybrid Deep Learning-Rule-Based approach similar to [27, 29]. In this approach, one first detects the position of the table-cells with object detection (e.g. YoloVx or MaskRCNN), then classifies the table into different types (from its images) and finally uses different rule-sets to obtain its table-structure. Currently, this approach achieves stateof-the-art results, but is not an end-to-end deep-learning method. As such, new rules need to be written if different types of tables are encountered."}, {"label": "section_header", "id": 8, "page_no": 2, "cluster": {"id": 8, "label": "section_header", "bbox": {"l": 50.112, "t": 635.9449999999999, "r": 105.225, "b": 646.693, "coord_origin": "TOPLEFT"}, "confidence": 0.9423062205314636, "cells": [{"index": 96, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 646.693, "r_x1": 105.225, "r_y1": 646.693, "r_x2": 105.225, "r_y2": 635.9449999999999, "r_x3": 50.112, "r_y3": 635.9449999999999, "coord_origin": "TOPLEFT"}, "text": "3. Datasets", "orig": "3. Datasets", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "3. Datasets"}, {"label": "text", "id": 3, "page_no": 2, "cluster": {"id": 3, "label": "text", "bbox": {"l": 50.112, "t": 656.694, "r": 286.365, "b": 713.066, "coord_origin": "TOPLEFT"}, "confidence": 0.9862047433853149, "cells": [{"index": 97, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 665.246, "r_x1": 286.365, "r_y1": 665.246, "r_x2": 286.365, "r_y2": 656.694, "r_x3": 62.067, "r_y3": 656.694, "coord_origin": "TOPLEFT"}, "text": "We rely on large-scale datasets such as PubTabNet [37],", "orig": "We rely on large-scale datasets such as PubTabNet [37],", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 98, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 677.201, "r_x1": 286.365, "r_y1": 677.201, "r_x2": 286.365, "r_y2": 668.649, "r_x3": 50.112, "r_y3": 668.649, "coord_origin": "TOPLEFT"}, "text": "FinTabNet [36], and TableBank [17] datasets to train and", "orig": "FinTabNet [36], and TableBank [17] datasets to train and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 99, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 689.156, "r_x1": 133.479, "r_y1": 689.156, "r_x2": 133.479, "r_y2": 680.604, "r_x3": 50.112, "r_y3": 680.604, "coord_origin": "TOPLEFT"}, "text": "evaluate our models.", "orig": "evaluate our models.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 100, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 138.271, "r_y0": 689.156, "r_x1": 286.365, "r_y1": 689.156, "r_x2": 286.365, "r_y2": 680.604, "r_x3": 138.271, "r_y3": 680.604, "coord_origin": "TOPLEFT"}, "text": "These datasets span over various ap-", "orig": "These datasets span over various ap-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 101, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 701.111, "r_x1": 166.246, "r_y1": 701.111, "r_x2": 166.246, "r_y2": 692.559, "r_x3": 50.112, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "pearance styles and content.", "orig": "pearance styles and content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 102, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 173.688, "r_y0": 701.111, "r_x1": 286.365, "r_y1": 701.111, "r_x2": 286.365, "r_y2": 692.559, "r_x3": 173.688, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "We also introduce our own", "orig": "We also introduce our own", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 103, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 713.066, "r_x1": 286.365, "r_y1": 713.066, "r_x2": 286.365, "r_y2": 704.514, "r_x3": 50.112, "r_y3": 704.514, "coord_origin": "TOPLEFT"}, "text": "synthetically generated SynthTabNet dataset to fix an im-", "orig": "synthetically generated SynthTabNet dataset to fix an im-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "We rely on large-scale datasets such as PubTabNet [37], FinTabNet [36], and TableBank [17] datasets to train and evaluate our models. These datasets span over various appearance styles and content. We also introduce our own synthetically generated SynthTabNet dataset to fix an im-"}, {"label": "picture", "id": 6, "page_no": 2, "cluster": {"id": 6, "label": "picture", "bbox": {"l": 312.10369873046875, "t": 78.44086456298828, "r": 550.38916015625, "b": 250.60984802246094, "coord_origin": "TOPLEFT"}, "confidence": 0.9746918082237244, "cells": [{"index": 104, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 380.799, "r_y0": 88.46699999999998, "r_x1": 486.849, "r_y1": 88.46699999999998, "r_x2": 486.849, "r_y2": 80.154, "r_x3": 380.799, "r_y3": 80.154, "coord_origin": "TOPLEFT"}, "text": "PubTabNet + FinTabNet", "orig": "PubTabNet + FinTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 105, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 396.768, "r_y0": 250.68200000000002, "r_x1": 469.787, "r_y1": 250.68200000000002, "r_x2": 469.787, "r_y2": 242.36900000000003, "r_x3": 396.768, "r_y3": 242.36900000000003, "coord_origin": "TOPLEFT"}, "text": "Rows / Columns", "orig": "Rows / Columns", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 106, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.977, "r_y0": 239.19299999999998, "r_x1": 324.793, "r_y1": 239.19299999999998, "r_x2": 324.793, "r_y2": 233.65099999999995, "r_x3": 320.977, "r_y3": 233.65099999999995, "coord_origin": "TOPLEFT"}, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 107, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 410.483, "r_y0": 239.19299999999998, "r_x1": 418.113, "r_y1": 239.19299999999998, "r_x2": 418.113, "r_y2": 233.65099999999995, "r_x3": 410.483, "r_y3": 233.65099999999995, "coord_origin": "TOPLEFT"}, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 108, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 500.85, "r_y0": 239.19299999999998, "r_x1": 508.48, "r_y1": 239.19299999999998, "r_x2": 508.48, "r_y2": 233.65099999999995, "r_x3": 500.85, "r_y3": 233.65099999999995, "coord_origin": "TOPLEFT"}, "text": "40", "orig": "40", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 109, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 365.3, "r_y0": 239.19299999999998, "r_x1": 372.93, "r_y1": 239.19299999999998, "r_x2": 372.93, "r_y2": 233.65099999999995, "r_x3": 365.3, "r_y3": 233.65099999999995, "coord_origin": "TOPLEFT"}, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 110, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 455.666, "r_y0": 239.19299999999998, "r_x1": 463.296, "r_y1": 239.19299999999998, "r_x2": 463.296, "r_y2": 233.65099999999995, "r_x3": 455.666, "r_y3": 233.65099999999995, "coord_origin": "TOPLEFT"}, "text": "30", "orig": "30", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 111, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 542.035, "r_y0": 239.19299999999998, "r_x1": 549.665, "r_y1": 239.19299999999998, "r_x2": 549.665, "r_y2": 233.65099999999995, "r_x3": 542.035, "r_y3": 233.65099999999995, "coord_origin": "TOPLEFT"}, "text": "50", "orig": "50", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 112, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 316.045, "r_y0": 236.21699999999998, "r_x1": 319.861, "r_y1": 236.21699999999998, "r_x2": 319.861, "r_y2": 230.67399999999998, "r_x3": 316.045, "r_y3": 230.67399999999998, "coord_origin": "TOPLEFT"}, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 113, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 312.625, "r_y0": 204.461, "r_x1": 320.255, "r_y1": 204.461, "r_x2": 320.255, "r_y2": 198.91899999999998, "r_x3": 312.625, "r_y3": 198.91899999999998, "coord_origin": "TOPLEFT"}, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 114, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 313.15, "r_y0": 173.86800000000005, "r_x1": 320.78, "r_y1": 173.86800000000005, "r_x2": 320.78, "r_y2": 168.32600000000002, "r_x3": 313.15, "r_y3": 168.32600000000002, "coord_origin": "TOPLEFT"}, "text": "40", "orig": "40", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 115, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 312.93, "r_y0": 142.35799999999995, "r_x1": 320.56, "r_y1": 142.35799999999995, "r_x2": 320.56, "r_y2": 136.81600000000003, "r_x3": 312.93, "r_y3": 136.81600000000003, "coord_origin": "TOPLEFT"}, "text": "60", "orig": "60", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 116, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 312.482, "r_y0": 111.37199999999996, "r_x1": 320.112, "r_y1": 111.37199999999996, "r_x2": 320.112, "r_y2": 105.83000000000004, "r_x3": 312.482, "r_y3": 105.83000000000004, "coord_origin": "TOPLEFT"}, "text": "80", "orig": "80", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 117, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 312.482, "r_y0": 218.02999999999997, "r_x1": 320.112, "r_y1": 218.02999999999997, "r_x2": 320.112, "r_y2": 212.48699999999997, "r_x3": 312.482, "r_y3": 212.48699999999997, "coord_origin": "TOPLEFT"}, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 118, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 313.076, "r_y0": 189.49199999999996, "r_x1": 320.707, "r_y1": 189.49199999999996, "r_x2": 320.707, "r_y2": 183.95000000000005, "r_x3": 313.076, "r_y3": 183.95000000000005, "coord_origin": "TOPLEFT"}, "text": "30", "orig": "30", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 119, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 312.763, "r_y0": 158.24400000000003, "r_x1": 320.393, "r_y1": 158.24400000000003, "r_x2": 320.393, "r_y2": 152.702, "r_x3": 312.763, "r_y3": 152.702, "coord_origin": "TOPLEFT"}, "text": "50", "orig": "50", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 120, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 312.198, "r_y0": 126.34100000000001, "r_x1": 319.828, "r_y1": 126.34100000000001, "r_x2": 319.828, "r_y2": 120.798, "r_x3": 312.198, "r_y3": 120.798, "coord_origin": "TOPLEFT"}, "text": "70", "orig": "70", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 121, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 312.817, "r_y0": 95.87900000000002, "r_x1": 320.447, "r_y1": 95.87900000000002, "r_x2": 320.447, "r_y2": 90.33699999999999, "r_x3": 312.817, "r_y3": 90.33699999999999, "coord_origin": "TOPLEFT"}, "text": "90", "orig": "90", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 122, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 532.174, "r_y0": 229.94000000000005, "r_x1": 536.944, "r_y1": 229.94000000000005, "r_x2": 536.944, "r_y2": 223.01199999999994, "r_x3": 532.174, "r_y3": 223.01199999999994, "coord_origin": "TOPLEFT"}, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 123, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 532.88, "r_y0": 115.48000000000002, "r_x1": 547.613, "r_y1": 115.48000000000002, "r_x2": 547.613, "r_y2": 108.55200000000002, "r_x3": 532.88, "r_y3": 108.55200000000002, "coord_origin": "TOPLEFT"}, "text": "10K", "orig": "10K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 124, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 532.774, "r_y0": 137.99400000000003, "r_x1": 542.739, "r_y1": 137.99400000000003, "r_x2": 542.739, "r_y2": 131.06600000000003, "r_x3": 532.774, "r_y3": 131.06600000000003, "coord_origin": "TOPLEFT"}, "text": "8K", "orig": "8K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 125, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 532.799, "r_y0": 161.13599999999997, "r_x1": 542.764, "r_y1": 161.13599999999997, "r_x2": 542.764, "r_y2": 154.20799999999997, "r_x3": 532.799, "r_y3": 154.20799999999997, "coord_origin": "TOPLEFT"}, "text": "6K", "orig": "6K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 126, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 532.571, "r_y0": 183.971, "r_x1": 542.536, "r_y1": 183.971, "r_x2": 542.536, "r_y2": 177.043, "r_x3": 532.571, "r_y3": 177.043, "coord_origin": "TOPLEFT"}, "text": "4K", "orig": "4K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 127, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 532.146, "r_y0": 206.85900000000004, "r_x1": 542.111, "r_y1": 206.85900000000004, "r_x2": 542.111, "r_y2": 199.93100000000004, "r_x3": 532.146, "r_y3": 199.93100000000004, "coord_origin": "TOPLEFT"}, "text": "2K", "orig": "2K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": [{"id": 12, "label": "section_header", "bbox": {"l": 380.799, "t": 80.154, "r": 486.849, "b": 88.46699999999998, "coord_origin": "TOPLEFT"}, "confidence": 0.5687217116355896, "cells": [{"index": 104, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 380.799, "r_y0": 88.46699999999998, "r_x1": 486.849, "r_y1": 88.46699999999998, "r_x2": 486.849, "r_y2": 80.154, "r_x3": 380.799, "r_y3": 80.154, "coord_origin": "TOPLEFT"}, "text": "PubTabNet + FinTabNet", "orig": "PubTabNet + FinTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 16, "label": "text", "bbox": {"l": 396.768, "t": 242.36900000000003, "r": 469.787, "b": 250.68200000000002, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 105, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 396.768, "r_y0": 250.68200000000002, "r_x1": 469.787, "r_y1": 250.68200000000002, "r_x2": 469.787, "r_y2": 242.36900000000003, "r_x3": 396.768, "r_y3": 242.36900000000003, "coord_origin": "TOPLEFT"}, "text": "Rows / Columns", "orig": "Rows / Columns", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 17, "label": "text", "bbox": {"l": 320.977, "t": 233.65099999999995, "r": 324.793, "b": 239.19299999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 106, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.977, "r_y0": 239.19299999999998, "r_x1": 324.793, "r_y1": 239.19299999999998, "r_x2": 324.793, "r_y2": 233.65099999999995, "r_x3": 320.977, "r_y3": 233.65099999999995, "coord_origin": "TOPLEFT"}, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 18, "label": "text", "bbox": {"l": 410.483, "t": 233.65099999999995, "r": 418.113, "b": 239.19299999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 107, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 410.483, "r_y0": 239.19299999999998, "r_x1": 418.113, "r_y1": 239.19299999999998, "r_x2": 418.113, "r_y2": 233.65099999999995, "r_x3": 410.483, "r_y3": 233.65099999999995, "coord_origin": "TOPLEFT"}, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 19, "label": "text", "bbox": {"l": 500.85, "t": 233.65099999999995, "r": 508.48, "b": 239.19299999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 108, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 500.85, "r_y0": 239.19299999999998, "r_x1": 508.48, "r_y1": 239.19299999999998, "r_x2": 508.48, "r_y2": 233.65099999999995, "r_x3": 500.85, "r_y3": 233.65099999999995, "coord_origin": "TOPLEFT"}, "text": "40", "orig": "40", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 20, "label": "text", "bbox": {"l": 365.3, "t": 233.65099999999995, "r": 372.93, "b": 239.19299999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 109, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 365.3, "r_y0": 239.19299999999998, "r_x1": 372.93, "r_y1": 239.19299999999998, "r_x2": 372.93, "r_y2": 233.65099999999995, "r_x3": 365.3, "r_y3": 233.65099999999995, "coord_origin": "TOPLEFT"}, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 21, "label": "text", "bbox": {"l": 455.666, "t": 233.65099999999995, "r": 463.296, "b": 239.19299999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 110, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 455.666, "r_y0": 239.19299999999998, "r_x1": 463.296, "r_y1": 239.19299999999998, "r_x2": 463.296, "r_y2": 233.65099999999995, "r_x3": 455.666, "r_y3": 233.65099999999995, "coord_origin": "TOPLEFT"}, "text": "30", "orig": "30", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 22, "label": "text", "bbox": {"l": 542.035, "t": 233.65099999999995, "r": 549.665, "b": 239.19299999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 111, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 542.035, "r_y0": 239.19299999999998, "r_x1": 549.665, "r_y1": 239.19299999999998, "r_x2": 549.665, "r_y2": 233.65099999999995, "r_x3": 542.035, "r_y3": 233.65099999999995, "coord_origin": "TOPLEFT"}, "text": "50", "orig": "50", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 23, "label": "text", "bbox": {"l": 316.045, "t": 230.67399999999998, "r": 319.861, "b": 236.21699999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 112, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 316.045, "r_y0": 236.21699999999998, "r_x1": 319.861, "r_y1": 236.21699999999998, "r_x2": 319.861, "r_y2": 230.67399999999998, "r_x3": 316.045, "r_y3": 230.67399999999998, "coord_origin": "TOPLEFT"}, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 24, "label": "text", "bbox": {"l": 312.625, "t": 198.91899999999998, "r": 320.255, "b": 204.461, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 113, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 312.625, "r_y0": 204.461, "r_x1": 320.255, "r_y1": 204.461, "r_x2": 320.255, "r_y2": 198.91899999999998, "r_x3": 312.625, "r_y3": 198.91899999999998, "coord_origin": "TOPLEFT"}, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 25, "label": "text", "bbox": {"l": 313.15, "t": 168.32600000000002, "r": 320.78, "b": 173.86800000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 114, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 313.15, "r_y0": 173.86800000000005, "r_x1": 320.78, "r_y1": 173.86800000000005, "r_x2": 320.78, "r_y2": 168.32600000000002, "r_x3": 313.15, "r_y3": 168.32600000000002, "coord_origin": "TOPLEFT"}, "text": "40", "orig": "40", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 26, "label": "text", "bbox": {"l": 312.93, "t": 136.81600000000003, "r": 320.56, "b": 142.35799999999995, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 115, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 312.93, "r_y0": 142.35799999999995, "r_x1": 320.56, "r_y1": 142.35799999999995, "r_x2": 320.56, "r_y2": 136.81600000000003, "r_x3": 312.93, "r_y3": 136.81600000000003, "coord_origin": "TOPLEFT"}, "text": "60", "orig": "60", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 27, "label": "text", "bbox": {"l": 312.482, "t": 105.83000000000004, "r": 320.112, "b": 111.37199999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 116, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 312.482, "r_y0": 111.37199999999996, "r_x1": 320.112, "r_y1": 111.37199999999996, "r_x2": 320.112, "r_y2": 105.83000000000004, "r_x3": 312.482, "r_y3": 105.83000000000004, "coord_origin": "TOPLEFT"}, "text": "80", "orig": "80", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 28, "label": "text", "bbox": {"l": 312.482, "t": 212.48699999999997, "r": 320.112, "b": 218.02999999999997, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 117, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 312.482, "r_y0": 218.02999999999997, "r_x1": 320.112, "r_y1": 218.02999999999997, "r_x2": 320.112, "r_y2": 212.48699999999997, "r_x3": 312.482, "r_y3": 212.48699999999997, "coord_origin": "TOPLEFT"}, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 29, "label": "text", "bbox": {"l": 313.076, "t": 183.95000000000005, "r": 320.707, "b": 189.49199999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 118, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 313.076, "r_y0": 189.49199999999996, "r_x1": 320.707, "r_y1": 189.49199999999996, "r_x2": 320.707, "r_y2": 183.95000000000005, "r_x3": 313.076, "r_y3": 183.95000000000005, "coord_origin": "TOPLEFT"}, "text": "30", "orig": "30", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 30, "label": "text", "bbox": {"l": 312.763, "t": 152.702, "r": 320.393, "b": 158.24400000000003, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 119, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 312.763, "r_y0": 158.24400000000003, "r_x1": 320.393, "r_y1": 158.24400000000003, "r_x2": 320.393, "r_y2": 152.702, "r_x3": 312.763, "r_y3": 152.702, "coord_origin": "TOPLEFT"}, "text": "50", "orig": "50", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 31, "label": "text", "bbox": {"l": 312.198, "t": 120.798, "r": 319.828, "b": 126.34100000000001, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 120, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 312.198, "r_y0": 126.34100000000001, "r_x1": 319.828, "r_y1": 126.34100000000001, "r_x2": 319.828, "r_y2": 120.798, "r_x3": 312.198, "r_y3": 120.798, "coord_origin": "TOPLEFT"}, "text": "70", "orig": "70", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 32, "label": "text", "bbox": {"l": 312.817, "t": 90.33699999999999, "r": 320.447, "b": 95.87900000000002, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 121, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 312.817, "r_y0": 95.87900000000002, "r_x1": 320.447, "r_y1": 95.87900000000002, "r_x2": 320.447, "r_y2": 90.33699999999999, "r_x3": 312.817, "r_y3": 90.33699999999999, "coord_origin": "TOPLEFT"}, "text": "90", "orig": "90", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 33, "label": "text", "bbox": {"l": 532.174, "t": 223.01199999999994, "r": 536.944, "b": 229.94000000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 122, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 532.174, "r_y0": 229.94000000000005, "r_x1": 536.944, "r_y1": 229.94000000000005, "r_x2": 536.944, "r_y2": 223.01199999999994, "r_x3": 532.174, "r_y3": 223.01199999999994, "coord_origin": "TOPLEFT"}, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 34, "label": "text", "bbox": {"l": 532.88, "t": 108.55200000000002, "r": 547.613, "b": 115.48000000000002, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 123, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 532.88, "r_y0": 115.48000000000002, "r_x1": 547.613, "r_y1": 115.48000000000002, "r_x2": 547.613, "r_y2": 108.55200000000002, "r_x3": 532.88, "r_y3": 108.55200000000002, "coord_origin": "TOPLEFT"}, "text": "10K", "orig": "10K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 35, "label": "text", "bbox": {"l": 532.774, "t": 131.06600000000003, "r": 542.739, "b": 137.99400000000003, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 124, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 532.774, "r_y0": 137.99400000000003, "r_x1": 542.739, "r_y1": 137.99400000000003, "r_x2": 542.739, "r_y2": 131.06600000000003, "r_x3": 532.774, "r_y3": 131.06600000000003, "coord_origin": "TOPLEFT"}, "text": "8K", "orig": "8K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 36, "label": "text", "bbox": {"l": 532.799, "t": 154.20799999999997, "r": 542.764, "b": 161.13599999999997, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 125, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 532.799, "r_y0": 161.13599999999997, "r_x1": 542.764, "r_y1": 161.13599999999997, "r_x2": 542.764, "r_y2": 154.20799999999997, "r_x3": 532.799, "r_y3": 154.20799999999997, "coord_origin": "TOPLEFT"}, "text": "6K", "orig": "6K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 37, "label": "text", "bbox": {"l": 532.571, "t": 177.043, "r": 542.536, "b": 183.971, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 126, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 532.571, "r_y0": 183.971, "r_x1": 542.536, "r_y1": 183.971, "r_x2": 542.536, "r_y2": 177.043, "r_x3": 532.571, "r_y3": 177.043, "coord_origin": "TOPLEFT"}, "text": "4K", "orig": "4K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 38, "label": "text", "bbox": {"l": 532.146, "t": 199.93100000000004, "r": 542.111, "b": 206.85900000000004, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 127, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 532.146, "r_y0": 206.85900000000004, "r_x1": 542.111, "r_y1": 206.85900000000004, "r_x2": 542.111, "r_y2": 199.93100000000004, "r_x3": 532.146, "r_y3": 199.93100000000004, "coord_origin": "TOPLEFT"}, "text": "2K", "orig": "2K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}]}, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null}, {"label": "caption", "id": 7, "page_no": 2, "cluster": {"id": 7, "label": "caption", "bbox": {"l": 308.862, "t": 268.105, "r": 545.115, "b": 288.612, "coord_origin": "TOPLEFT"}, "confidence": 0.9667505025863647, "cells": [{"index": 128, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 276.65700000000004, "r_x1": 346.062, "r_y1": 276.65700000000004, "r_x2": 346.062, "r_y2": 268.105, "r_x3": 308.862, "r_y3": 268.105, "coord_origin": "TOPLEFT"}, "text": "Figure 2:", "orig": "Figure 2:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 129, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 354.491, "r_y0": 276.65700000000004, "r_x1": 545.115, "r_y1": 276.65700000000004, "r_x2": 545.115, "r_y2": 268.105, "r_x3": 354.491, "r_y3": 268.105, "coord_origin": "TOPLEFT"}, "text": "Distribution of the tables across different table", "orig": "Distribution of the tables across different table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 130, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 288.612, "r_x1": 498.57, "r_y1": 288.612, "r_x2": 498.57, "r_y2": 280.06, "r_x3": 308.862, "r_y3": 280.06, "coord_origin": "TOPLEFT"}, "text": "dimensions in PubTabNet + FinTabNet datasets", "orig": "dimensions in PubTabNet + FinTabNet datasets", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Figure 2: Distribution of the tables across different table dimensions in PubTabNet + FinTabNet datasets"}, {"label": "text", "id": 9, "page_no": 2, "cluster": {"id": 9, "label": "text", "bbox": {"l": 308.862, "t": 317.742, "r": 437.27, "b": 326.294, "coord_origin": "TOPLEFT"}, "confidence": 0.8879811763763428, "cells": [{"index": 131, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 326.294, "r_x1": 437.27, "r_y1": 326.294, "r_x2": 437.27, "r_y2": 317.742, "r_x3": 308.862, "r_y3": 317.742, "coord_origin": "TOPLEFT"}, "text": "balance in the previous datasets.", "orig": "balance in the previous datasets.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "balance in the previous datasets."}, {"label": "text", "id": 2, "page_no": 2, "cluster": {"id": 2, "label": "text", "bbox": {"l": 308.862, "t": 331.8, "r": 545.115, "b": 627.2760000000001, "coord_origin": "TOPLEFT"}, "confidence": 0.9870319366455078, "cells": [{"index": 132, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 340.352, "r_x1": 545.115, "r_y1": 340.352, "r_x2": 545.115, "r_y2": 331.8, "r_x3": 320.817, "r_y3": 331.8, "coord_origin": "TOPLEFT"}, "text": "The PubTabNet dataset contains 509k tables delivered as", "orig": "The PubTabNet dataset contains 509k tables delivered as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 133, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 352.307, "r_x1": 545.115, "r_y1": 352.307, "r_x2": 545.115, "r_y2": 343.755, "r_x3": 308.862, "r_y3": 343.755, "coord_origin": "TOPLEFT"}, "text": "annotated PNGimages. The annotations consist of the table", "orig": "annotated PNGimages. The annotations consist of the table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 134, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 364.263, "r_x1": 545.115, "r_y1": 364.263, "r_x2": 545.115, "r_y2": 355.711, "r_x3": 308.862, "r_y3": 355.711, "coord_origin": "TOPLEFT"}, "text": "structure represented in HTML format, the tokenized text", "orig": "structure represented in HTML format, the tokenized text", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 135, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 376.218, "r_x1": 545.115, "r_y1": 376.218, "r_x2": 545.115, "r_y2": 367.666, "r_x3": 308.862, "r_y3": 367.666, "coord_origin": "TOPLEFT"}, "text": "and its bounding boxes per table cell. Fig. 1 shows the ap-", "orig": "and its bounding boxes per table cell. Fig. 1 shows the ap-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 136, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 388.173, "r_x1": 545.115, "r_y1": 388.173, "r_x2": 545.115, "r_y2": 379.621, "r_x3": 308.862, "r_y3": 379.621, "coord_origin": "TOPLEFT"}, "text": "pearance style of PubTabNet. Depending on its complexity,", "orig": "pearance style of PubTabNet. Depending on its complexity,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 137, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 400.128, "r_x1": 545.115, "r_y1": 400.128, "r_x2": 545.115, "r_y2": 391.576, "r_x3": 308.862, "r_y3": 391.576, "coord_origin": "TOPLEFT"}, "text": "a table is characterized as 'simple' when it does not contain", "orig": "a table is characterized as 'simple' when it does not contain", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 138, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 412.083, "r_x1": 545.115, "r_y1": 412.083, "r_x2": 545.115, "r_y2": 403.531, "r_x3": 308.862, "r_y3": 403.531, "coord_origin": "TOPLEFT"}, "text": "row spans or column spans, otherwise it is 'complex'. The", "orig": "row spans or column spans, otherwise it is 'complex'. The", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 139, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 424.038, "r_x1": 545.115, "r_y1": 424.038, "r_x2": 545.115, "r_y2": 415.486, "r_x3": 308.862, "r_y3": 415.486, "coord_origin": "TOPLEFT"}, "text": "dataset is divided into Train and Val splits (roughly 98%and", "orig": "dataset is divided into Train and Val splits (roughly 98%and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 140, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 435.994, "r_x1": 545.115, "r_y1": 435.994, "r_x2": 545.115, "r_y2": 427.442, "r_x3": 308.862, "r_y3": 427.442, "coord_origin": "TOPLEFT"}, "text": "2%). The Train split consists of 54% simple and 46% com-", "orig": "2%). The Train split consists of 54% simple and 46% com-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 141, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 447.949, "r_x1": 545.115, "r_y1": 447.949, "r_x2": 545.115, "r_y2": 439.397, "r_x3": 308.862, "r_y3": 439.397, "coord_origin": "TOPLEFT"}, "text": "plex tables and the Val split of 51% and 49% respectively.", "orig": "plex tables and the Val split of 51% and 49% respectively.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 142, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 459.904, "r_x1": 545.115, "r_y1": 459.904, "r_x2": 545.115, "r_y2": 451.352, "r_x3": 308.862, "r_y3": 451.352, "coord_origin": "TOPLEFT"}, "text": "The FinTabNet dataset contains 112k tables delivered as", "orig": "The FinTabNet dataset contains 112k tables delivered as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 143, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 471.859, "r_x1": 545.115, "r_y1": 471.859, "r_x2": 545.115, "r_y2": 463.307, "r_x3": 308.862, "r_y3": 463.307, "coord_origin": "TOPLEFT"}, "text": "single-page PDFdocuments with mixed table structures and", "orig": "single-page PDFdocuments with mixed table structures and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 144, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 483.814, "r_x1": 358.984, "r_y1": 483.814, "r_x2": 358.984, "r_y2": 475.262, "r_x3": 308.862, "r_y3": 475.262, "coord_origin": "TOPLEFT"}, "text": "text content.", "orig": "text content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 145, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 365.121, "r_y0": 483.814, "r_x1": 545.115, "r_y1": 483.814, "r_x2": 545.115, "r_y2": 475.262, "r_x3": 365.121, "r_y3": 475.262, "coord_origin": "TOPLEFT"}, "text": "Similarly to the PubTabNet, the annotations", "orig": "Similarly to the PubTabNet, the annotations", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 146, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 495.77, "r_x1": 545.115, "r_y1": 495.77, "r_x2": 545.115, "r_y2": 487.218, "r_x3": 308.862, "r_y3": 487.218, "coord_origin": "TOPLEFT"}, "text": "of FinTabNet include the table structure in HTML, the to-", "orig": "of FinTabNet include the table structure in HTML, the to-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 147, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 507.725, "r_x1": 545.115, "r_y1": 507.725, "r_x2": 545.115, "r_y2": 499.173, "r_x3": 308.862, "r_y3": 499.173, "coord_origin": "TOPLEFT"}, "text": "kenized text and the bounding boxes on a table cell basis.", "orig": "kenized text and the bounding boxes on a table cell basis.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 148, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 519.6800000000001, "r_x1": 545.115, "r_y1": 519.6800000000001, "r_x2": 545.115, "r_y2": 511.128, "r_x3": 308.862, "r_y3": 511.128, "coord_origin": "TOPLEFT"}, "text": "The dataset is divided into Train, Test and Val splits (81%,", "orig": "The dataset is divided into Train, Test and Val splits (81%,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 149, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 531.635, "r_x1": 545.115, "r_y1": 531.635, "r_x2": 545.115, "r_y2": 523.0830000000001, "r_x3": 308.862, "r_y3": 523.0830000000001, "coord_origin": "TOPLEFT"}, "text": "9.5%, 9.5%), and each one is almost equally divided into", "orig": "9.5%, 9.5%), and each one is almost equally divided into", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 150, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 543.59, "r_x1": 545.115, "r_y1": 543.59, "r_x2": 545.115, "r_y2": 535.038, "r_x3": 308.862, "r_y3": 535.038, "coord_origin": "TOPLEFT"}, "text": "simple and complex tables (Train: 48% simple, 52% com-", "orig": "simple and complex tables (Train: 48% simple, 52% com-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 151, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 555.545, "r_x1": 350.964, "r_y1": 555.545, "r_x2": 350.964, "r_y2": 546.9929999999999, "r_x3": 308.862, "r_y3": 546.9929999999999, "coord_origin": "TOPLEFT"}, "text": "plex, Test:", "orig": "plex, Test:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 152, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 355.467, "r_y0": 555.545, "r_x1": 490.082, "r_y1": 555.545, "r_x2": 490.082, "r_y2": 546.9929999999999, "r_x3": 355.467, "r_y3": 546.9929999999999, "coord_origin": "TOPLEFT"}, "text": "48% simple, 52% complex, Test:", "orig": "48% simple, 52% complex, Test:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 153, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 494.595, "r_y0": 555.545, "r_x1": 545.115, "r_y1": 555.545, "r_x2": 545.115, "r_y2": 546.9929999999999, "r_x3": 494.595, "r_y3": 546.9929999999999, "coord_origin": "TOPLEFT"}, "text": "53% simple,", "orig": "53% simple,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 154, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 567.501, "r_x1": 370.6, "r_y1": 567.501, "r_x2": 370.6, "r_y2": 558.9490000000001, "r_x3": 308.862, "r_y3": 558.9490000000001, "coord_origin": "TOPLEFT"}, "text": "47% complex).", "orig": "47% complex).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 155, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 376.737, "r_y0": 567.501, "r_x1": 545.115, "r_y1": 567.501, "r_x2": 545.115, "r_y2": 558.9490000000001, "r_x3": 376.737, "r_y3": 558.9490000000001, "coord_origin": "TOPLEFT"}, "text": "Finally the TableBank dataset consists of", "orig": "Finally the TableBank dataset consists of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 156, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 579.456, "r_x1": 545.115, "r_y1": 579.456, "r_x2": 545.115, "r_y2": 570.904, "r_x3": 308.862, "r_y3": 570.904, "coord_origin": "TOPLEFT"}, "text": "145k tables provided as JPEG images. The latter has anno-", "orig": "145k tables provided as JPEG images. The latter has anno-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 157, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 591.4110000000001, "r_x1": 545.115, "r_y1": 591.4110000000001, "r_x2": 545.115, "r_y2": 582.859, "r_x3": 308.862, "r_y3": 582.859, "coord_origin": "TOPLEFT"}, "text": "tations for the table structure, but only few with bounding", "orig": "tations for the table structure, but only few with bounding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 158, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 603.366, "r_x1": 403.726, "r_y1": 603.366, "r_x2": 403.726, "r_y2": 594.814, "r_x3": 308.862, "r_y3": 594.814, "coord_origin": "TOPLEFT"}, "text": "boxes of the table cells.", "orig": "boxes of the table cells.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 159, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 407.731, "r_y0": 603.366, "r_x1": 545.115, "r_y1": 603.366, "r_x2": 545.115, "r_y2": 594.814, "r_x3": 407.731, "r_y3": 594.814, "coord_origin": "TOPLEFT"}, "text": "The entire dataset consists of sim-", "orig": "The entire dataset consists of sim-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 160, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 615.321, "r_x1": 545.115, "r_y1": 615.321, "r_x2": 545.115, "r_y2": 606.769, "r_x3": 308.862, "r_y3": 606.769, "coord_origin": "TOPLEFT"}, "text": "ple tables and it is divided into 90% Train, 3% Test and 7%", "orig": "ple tables and it is divided into 90% Train, 3% Test and 7%", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 161, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 627.2760000000001, "r_x1": 348.164, "r_y1": 627.2760000000001, "r_x2": 348.164, "r_y2": 618.7239999999999, "r_x3": 308.862, "r_y3": 618.7239999999999, "coord_origin": "TOPLEFT"}, "text": "Val splits.", "orig": "Val splits.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "The PubTabNet dataset contains 509k tables delivered as annotated PNGimages. The annotations consist of the table structure represented in HTML format, the tokenized text and its bounding boxes per table cell. Fig. 1 shows the appearance style of PubTabNet. Depending on its complexity, a table is characterized as 'simple' when it does not contain row spans or column spans, otherwise it is 'complex'. The dataset is divided into Train and Val splits (roughly 98%and 2%). The Train split consists of 54% simple and 46% complex tables and the Val split of 51% and 49% respectively. The FinTabNet dataset contains 112k tables delivered as single-page PDFdocuments with mixed table structures and text content. Similarly to the PubTabNet, the annotations of FinTabNet include the table structure in HTML, the tokenized text and the bounding boxes on a table cell basis. The dataset is divided into Train, Test and Val splits (81%, 9.5%, 9.5%), and each one is almost equally divided into simple and complex tables (Train: 48% simple, 52% complex, Test: 48% simple, 52% complex, Test: 53% simple, 47% complex). Finally the TableBank dataset consists of 145k tables provided as JPEG images. The latter has annotations for the table structure, but only few with bounding boxes of the table cells. The entire dataset consists of simple tables and it is divided into 90% Train, 3% Test and 7% Val splits."}, {"label": "text", "id": 4, "page_no": 2, "cluster": {"id": 4, "label": "text", "bbox": {"l": 308.862, "t": 632.783, "r": 545.115, "b": 713.066, "coord_origin": "TOPLEFT"}, "confidence": 0.9840091466903687, "cells": [{"index": 162, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 641.335, "r_x1": 545.115, "r_y1": 641.335, "r_x2": 545.115, "r_y2": 632.783, "r_x3": 320.817, "r_y3": 632.783, "coord_origin": "TOPLEFT"}, "text": "Due to the heterogeneity across the dataset formats, it", "orig": "Due to the heterogeneity across the dataset formats, it", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 163, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 653.29, "r_x1": 545.115, "r_y1": 653.29, "r_x2": 545.115, "r_y2": 644.738, "r_x3": 308.862, "r_y3": 644.738, "coord_origin": "TOPLEFT"}, "text": "was necessary to combine all available data into one homog-", "orig": "was necessary to combine all available data into one homog-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 164, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 665.245, "r_x1": 545.115, "r_y1": 665.245, "r_x2": 545.115, "r_y2": 656.693, "r_x3": 308.862, "r_y3": 656.693, "coord_origin": "TOPLEFT"}, "text": "enized dataset before we could train our models for practi-", "orig": "enized dataset before we could train our models for practi-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 165, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 677.201, "r_x1": 361.245, "r_y1": 677.201, "r_x2": 361.245, "r_y2": 668.649, "r_x3": 308.862, "r_y3": 668.649, "coord_origin": "TOPLEFT"}, "text": "cal purposes.", "orig": "cal purposes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 166, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 365.44, "r_y0": 677.201, "r_x1": 545.115, "r_y1": 677.201, "r_x2": 545.115, "r_y2": 668.649, "r_x3": 365.44, "r_y3": 668.649, "coord_origin": "TOPLEFT"}, "text": "Given the size of PubTabNet, we adopted its", "orig": "Given the size of PubTabNet, we adopted its", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 167, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 689.156, "r_x1": 545.115, "r_y1": 689.156, "r_x2": 545.115, "r_y2": 680.604, "r_x3": 308.862, "r_y3": 680.604, "coord_origin": "TOPLEFT"}, "text": "annotation format and we extracted and converted all tables", "orig": "annotation format and we extracted and converted all tables", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 168, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 701.111, "r_x1": 487.322, "r_y1": 701.111, "r_x2": 487.322, "r_y2": 692.559, "r_x3": 308.862, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "as PNG images with a resolution of 72 dpi.", "orig": "as PNG images with a resolution of 72 dpi.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 169, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 492.901, "r_y0": 701.111, "r_x1": 545.115, "r_y1": 701.111, "r_x2": 545.115, "r_y2": 692.559, "r_x3": 492.901, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "Additionally,", "orig": "Additionally,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 170, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 713.066, "r_x1": 545.115, "r_y1": 713.066, "r_x2": 545.115, "r_y2": 704.514, "r_x3": 308.862, "r_y3": 704.514, "coord_origin": "TOPLEFT"}, "text": "we have filtered out tables with extreme sizes due to small", "orig": "we have filtered out tables with extreme sizes due to small", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Due to the heterogeneity across the dataset formats, it was necessary to combine all available data into one homogenized dataset before we could train our models for practical purposes. Given the size of PubTabNet, we adopted its annotation format and we extracted and converted all tables as PNG images with a resolution of 72 dpi. Additionally, we have filtered out tables with extreme sizes due to small"}, {"label": "page_footer", "id": 11, "page_no": 2, "cluster": {"id": 11, "label": "page_footer", "bbox": {"l": 295.121, "t": 734.402, "r": 300.102, "b": 742.954, "coord_origin": "TOPLEFT"}, "confidence": 0.8715606927871704, "cells": [{"index": 171, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 295.121, "r_y0": 742.954, "r_x1": 300.102, "r_y1": 742.954, "r_x2": 300.102, "r_y2": 734.402, "r_x3": 295.121, "r_y3": 734.402, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "3"}], "body": [{"label": "text", "id": 10, "page_no": 2, "cluster": {"id": 10, "label": "text", "bbox": {"l": 50.112, "t": 75.47699999999998, "r": 250.151, "b": 84.029, "coord_origin": "TOPLEFT"}, "confidence": 0.8767216801643372, "cells": [{"index": 0, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 84.029, "r_x1": 250.151, "r_y1": 84.029, "r_x2": 250.151, "r_y2": 75.47699999999998, "r_x3": 50.112, "r_y3": 75.47699999999998, "coord_origin": "TOPLEFT"}, "text": "tag-decoder which is constrained to the table-tags.", "orig": "tag-decoder which is constrained to the table-tags.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "tag-decoder which is constrained to the table-tags."}, {"label": "text", "id": 5, "page_no": 2, "cluster": {"id": 5, "label": "text", "bbox": {"l": 50.112, "t": 87.48800000000006, "r": 286.365, "b": 275.36800000000005, "coord_origin": "TOPLEFT"}, "confidence": 0.9822593927383423, "cells": [{"index": 1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 96.03999999999996, "r_x1": 70.366, "r_y1": 96.03999999999996, "r_x2": 70.366, "r_y2": 87.48800000000006, "r_x3": 62.067, "r_y3": 87.48800000000006, "coord_origin": "TOPLEFT"}, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 76.931, "r_y0": 96.03999999999996, "r_x1": 110.953, "r_y1": 96.03999999999996, "r_x2": 110.953, "r_y2": 87.48800000000006, "r_x3": 76.931, "r_y3": 87.48800000000006, "coord_origin": "TOPLEFT"}, "text": "practice,", "orig": "practice,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 118.545, "r_y0": 96.03999999999996, "r_x1": 136.258, "r_y1": 96.03999999999996, "r_x2": 136.258, "r_y2": 87.48800000000006, "r_x3": 118.545, "r_y3": 87.48800000000006, "coord_origin": "TOPLEFT"}, "text": "both", "orig": "both", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 142.824, "r_y0": 96.03999999999996, "r_x1": 175.372, "r_y1": 96.03999999999996, "r_x2": 175.372, "r_y2": 87.48800000000006, "r_x3": 142.824, "r_y3": 87.48800000000006, "coord_origin": "TOPLEFT"}, "text": "network", "orig": "network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 181.947, "r_y0": 96.03999999999996, "r_x1": 232.836, "r_y1": 96.03999999999996, "r_x2": 232.836, "r_y2": 87.48800000000006, "r_x3": 181.947, "r_y3": 87.48800000000006, "coord_origin": "TOPLEFT"}, "text": "architectures", "orig": "architectures", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 239.411, "r_y0": 96.03999999999996, "r_x1": 265.414, "r_y1": 96.03999999999996, "r_x2": 265.414, "r_y2": 87.48800000000006, "r_x3": 239.411, "r_y3": 87.48800000000006, "coord_origin": "TOPLEFT"}, "text": "(IETD", "orig": "(IETD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 271.979, "r_y0": 96.03999999999996, "r_x1": 286.365, "r_y1": 96.03999999999996, "r_x2": 286.365, "r_y2": 87.48800000000006, "r_x3": 271.979, "r_y3": 87.48800000000006, "coord_origin": "TOPLEFT"}, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 107.995, "r_x1": 286.365, "r_y1": 107.995, "r_x2": 286.365, "r_y2": 99.44299999999998, "r_x3": 50.112, "r_y3": 99.44299999999998, "coord_origin": "TOPLEFT"}, "text": "IEDD) require an implicit, custom trained object-character-", "orig": "IEDD) require an implicit, custom trained object-character-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 119.95100000000002, "r_x1": 286.365, "r_y1": 119.95100000000002, "r_x2": 286.365, "r_y2": 111.399, "r_x3": 50.112, "r_y3": 111.399, "coord_origin": "TOPLEFT"}, "text": "recognition (OCR) to obtain the content of the table-cells.", "orig": "recognition (OCR) to obtain the content of the table-cells.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 131.90599999999995, "r_x1": 286.365, "r_y1": 131.90599999999995, "r_x2": 286.365, "r_y2": 123.35400000000004, "r_x3": 50.112, "r_y3": 123.35400000000004, "coord_origin": "TOPLEFT"}, "text": "In the case of IETD, this OCR engine is implicit in the de-", "orig": "In the case of IETD, this OCR engine is implicit in the de-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 143.861, "r_x1": 286.365, "r_y1": 143.861, "r_x2": 286.365, "r_y2": 135.30899999999997, "r_x3": 50.112, "r_y3": 135.30899999999997, "coord_origin": "TOPLEFT"}, "text": "coder similar to [24]. For the IEDD, the OCR is solely em-", "orig": "coder similar to [24]. For the IEDD, the OCR is solely em-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 155.81600000000003, "r_x1": 174.206, "r_y1": 155.81600000000003, "r_x2": 174.206, "r_y2": 147.264, "r_x3": 50.112, "r_y3": 147.264, "coord_origin": "TOPLEFT"}, "text": "bedded in the content-decoder.", "orig": "bedded in the content-decoder.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 179.098, "r_y0": 155.81600000000003, "r_x1": 286.365, "r_y1": 155.81600000000003, "r_x2": 286.365, "r_y2": 147.264, "r_x3": 179.098, "r_y3": 147.264, "coord_origin": "TOPLEFT"}, "text": "This reliance on a custom,", "orig": "This reliance on a custom,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 167.77099999999996, "r_x1": 243.267, "r_y1": 167.77099999999996, "r_x2": 243.267, "r_y2": 159.21900000000005, "r_x3": 50.112, "r_y3": 159.21900000000005, "coord_origin": "TOPLEFT"}, "text": "implicit OCR decoder is of course problematic.", "orig": "implicit OCR decoder is of course problematic.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 248.437, "r_y0": 167.77099999999996, "r_x1": 286.365, "r_y1": 167.77099999999996, "r_x2": 286.365, "r_y2": 159.21900000000005, "r_x3": 248.437, "r_y3": 159.21900000000005, "coord_origin": "TOPLEFT"}, "text": "OCR is a", "orig": "OCR is a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 179.726, "r_x1": 286.365, "r_y1": 179.726, "r_x2": 286.365, "r_y2": 171.17399999999998, "r_x3": 50.112, "r_y3": 171.17399999999998, "coord_origin": "TOPLEFT"}, "text": "well known and extremely tough problem, that often needs", "orig": "well known and extremely tough problem, that often needs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 191.68200000000002, "r_x1": 286.365, "r_y1": 191.68200000000002, "r_x2": 286.365, "r_y2": 183.13, "r_x3": 50.112, "r_y3": 183.13, "coord_origin": "TOPLEFT"}, "text": "custom training for each individual language. However, the", "orig": "custom training for each individual language. However, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 203.63699999999994, "r_x1": 126.655, "r_y1": 203.63699999999994, "r_x2": 126.655, "r_y2": 195.08500000000004, "r_x3": 50.112, "r_y3": 195.08500000000004, "coord_origin": "TOPLEFT"}, "text": "limited availability", "orig": "limited availability", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 19, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 130.59, "r_y0": 203.63699999999994, "r_x1": 142.206, "r_y1": 203.63699999999994, "r_x2": 142.206, "r_y2": 195.08500000000004, "r_x3": 130.59, "r_y3": 195.08500000000004, "coord_origin": "TOPLEFT"}, "text": "for", "orig": "for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 20, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 146.132, "r_y0": 203.63699999999994, "r_x1": 286.365, "r_y1": 203.63699999999994, "r_x2": 286.365, "r_y2": 195.08500000000004, "r_x3": 146.132, "r_y3": 195.08500000000004, "coord_origin": "TOPLEFT"}, "text": "non-english content in the current", "orig": "non-english content in the current", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 21, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 215.59199999999998, "r_x1": 286.365, "r_y1": 215.59199999999998, "r_x2": 286.365, "r_y2": 207.03999999999996, "r_x3": 50.112, "r_y3": 207.03999999999996, "coord_origin": "TOPLEFT"}, "text": "datasets, makes it impractical to apply the IETD and IEDD", "orig": "datasets, makes it impractical to apply the IETD and IEDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 22, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 227.54700000000003, "r_x1": 286.365, "r_y1": 227.54700000000003, "r_x2": 286.365, "r_y2": 218.995, "r_x3": 50.112, "r_y3": 218.995, "coord_origin": "TOPLEFT"}, "text": "methods on tables with other languages. Additionally, OCR", "orig": "methods on tables with other languages. Additionally, OCR", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 23, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 239.50199999999995, "r_x1": 286.365, "r_y1": 239.50199999999995, "r_x2": 286.365, "r_y2": 230.95000000000005, "r_x3": 50.112, "r_y3": 230.95000000000005, "coord_origin": "TOPLEFT"}, "text": "can be completely omitted if the tables originate from pro-", "orig": "can be completely omitted if the tables originate from pro-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 24, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 251.457, "r_x1": 286.365, "r_y1": 251.457, "r_x2": 286.365, "r_y2": 242.90499999999997, "r_x3": 50.112, "r_y3": 242.90499999999997, "coord_origin": "TOPLEFT"}, "text": "grammatic PDF documents with known positions of each", "orig": "grammatic PDF documents with known positions of each", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 25, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 263.413, "r_x1": 66.989, "r_y1": 263.413, "r_x2": 66.989, "r_y2": 254.861, "r_x3": 50.112, "r_y3": 254.861, "coord_origin": "TOPLEFT"}, "text": "cell.", "orig": "cell.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 26, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 71.382, "r_y0": 263.413, "r_x1": 286.365, "r_y1": 263.413, "r_x2": 286.365, "r_y2": 254.861, "r_x3": 71.382, "r_y3": 254.861, "coord_origin": "TOPLEFT"}, "text": "The latter was the inspiration for the work of this pa-", "orig": "The latter was the inspiration for the work of this pa-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 27, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 275.36800000000005, "r_x1": 64.777, "r_y1": 275.36800000000005, "r_x2": 64.777, "r_y2": 266.81600000000003, "r_x3": 50.112, "r_y3": 266.81600000000003, "coord_origin": "TOPLEFT"}, "text": "per.", "orig": "per.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "In practice, both network architectures (IETD and IEDD) require an implicit, custom trained object-characterrecognition (OCR) to obtain the content of the table-cells. In the case of IETD, this OCR engine is implicit in the decoder similar to [24]. For the IEDD, the OCR is solely embedded in the content-decoder. This reliance on a custom, implicit OCR decoder is of course problematic. OCR is a well known and extremely tough problem, that often needs custom training for each individual language. However, the limited availability for non-english content in the current datasets, makes it impractical to apply the IETD and IEDD methods on tables with other languages. Additionally, OCR can be completely omitted if the tables originate from programmatic PDF documents with known positions of each cell. The latter was the inspiration for the work of this paper."}, {"label": "text", "id": 0, "page_no": 2, "cluster": {"id": 0, "label": "text", "bbox": {"l": 50.112, "t": 278.43899999999996, "r": 286.365, "b": 490.617, "coord_origin": "TOPLEFT"}, "confidence": 0.9878450036048889, "cells": [{"index": 28, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 287.395, "r_x1": 90.301, "r_y1": 287.395, "r_x2": 90.301, "r_y2": 278.43899999999996, "r_x3": 62.067, "r_y3": 278.43899999999996, "coord_origin": "TOPLEFT"}, "text": "Graph", "orig": "Graph", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 29, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 96.677, "r_y0": 287.395, "r_x1": 126.007, "r_y1": 287.395, "r_x2": 126.007, "r_y2": 278.43899999999996, "r_x3": 96.677, "r_y3": 278.43899999999996, "coord_origin": "TOPLEFT"}, "text": "Neural", "orig": "Neural", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 30, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 132.373, "r_y0": 287.395, "r_x1": 171.566, "r_y1": 287.395, "r_x2": 171.566, "r_y2": 278.43899999999996, "r_x3": 132.373, "r_y3": 278.43899999999996, "coord_origin": "TOPLEFT"}, "text": "networks", "orig": "networks", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 171.568, "r_y0": 287.379, "r_x1": 174.338, "r_y1": 287.379, "r_x2": 174.338, "r_y2": 278.827, "r_x3": 171.568, "r_y3": 278.827, "coord_origin": "TOPLEFT"}, "text": ":", "orig": ":", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 185.187, "r_y0": 287.379, "r_x1": 210.083, "r_y1": 287.379, "r_x2": 210.083, "r_y2": 278.827, "r_x3": 185.187, "r_y3": 278.827, "coord_origin": "TOPLEFT"}, "text": "Graph", "orig": "Graph", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 216.459, "r_y0": 287.379, "r_x1": 243.568, "r_y1": 287.379, "r_x2": 243.568, "r_y2": 278.827, "r_x3": 216.459, "r_y3": 278.827, "coord_origin": "TOPLEFT"}, "text": "Neural", "orig": "Neural", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 249.944, "r_y0": 287.379, "r_x1": 286.357, "r_y1": 287.379, "r_x2": 286.357, "r_y2": 278.827, "r_x3": 249.944, "r_y3": 278.827, "coord_origin": "TOPLEFT"}, "text": "networks", "orig": "networks", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 299.335, "r_x1": 84.971, "r_y1": 299.335, "r_x2": 84.971, "r_y2": 290.783, "r_x3": 50.112, "r_y3": 290.783, "coord_origin": "TOPLEFT"}, "text": "(GNN's)", "orig": "(GNN's)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 91.347, "r_y0": 299.335, "r_x1": 107.845, "r_y1": 299.335, "r_x2": 107.845, "r_y2": 290.783, "r_x3": 91.347, "r_y3": 290.783, "coord_origin": "TOPLEFT"}, "text": "take", "orig": "take", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 114.211, "r_y0": 299.335, "r_x1": 118.635, "r_y1": 299.335, "r_x2": 118.635, "r_y2": 290.783, "r_x3": 114.211, "r_y3": 290.783, "coord_origin": "TOPLEFT"}, "text": "a", "orig": "a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 125.011, "r_y0": 299.335, "r_x1": 159.87, "r_y1": 299.335, "r_x2": 159.87, "r_y2": 290.783, "r_x3": 125.011, "r_y3": 290.783, "coord_origin": "TOPLEFT"}, "text": "radically", "orig": "radically", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 166.246, "r_y0": 299.335, "r_x1": 200.298, "r_y1": 299.335, "r_x2": 200.298, "r_y2": 290.783, "r_x3": 166.246, "r_y3": 290.783, "coord_origin": "TOPLEFT"}, "text": "different", "orig": "different", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 206.664, "r_y0": 299.335, "r_x1": 243.177, "r_y1": 299.335, "r_x2": 243.177, "r_y2": 290.783, "r_x3": 206.664, "r_y3": 290.783, "coord_origin": "TOPLEFT"}, "text": "approach", "orig": "approach", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 249.553, "r_y0": 299.335, "r_x1": 257.304, "r_y1": 299.335, "r_x2": 257.304, "r_y2": 290.783, "r_x3": 249.553, "r_y3": 290.783, "coord_origin": "TOPLEFT"}, "text": "to", "orig": "to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 263.68, "r_y0": 299.335, "r_x1": 286.365, "r_y1": 299.335, "r_x2": 286.365, "r_y2": 290.783, "r_x3": 263.68, "r_y3": 290.783, "coord_origin": "TOPLEFT"}, "text": "table-", "orig": "table-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 311.29, "r_x1": 84.971, "r_y1": 311.29, "r_x2": 84.971, "r_y2": 302.738, "r_x3": 50.112, "r_y3": 302.738, "coord_origin": "TOPLEFT"}, "text": "structure", "orig": "structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 88.986, "r_y0": 311.29, "r_x1": 131.168, "r_y1": 311.29, "r_x2": 131.168, "r_y2": 302.738, "r_x3": 88.986, "r_y3": 302.738, "coord_origin": "TOPLEFT"}, "text": "extraction.", "orig": "extraction.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 138.849, "r_y0": 311.29, "r_x1": 286.365, "r_y1": 311.29, "r_x2": 286.365, "r_y2": 302.738, "r_x3": 138.849, "r_y3": 302.738, "coord_origin": "TOPLEFT"}, "text": "Note that one table cell can consti-", "orig": "Note that one table cell can consti-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 323.245, "r_x1": 286.365, "r_y1": 323.245, "r_x2": 286.365, "r_y2": 314.693, "r_x3": 50.112, "r_y3": 314.693, "coord_origin": "TOPLEFT"}, "text": "tute out of multiple text-cells. To obtain the table-structure,", "orig": "tute out of multiple text-cells. To obtain the table-structure,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 335.2, "r_x1": 136.996, "r_y1": 335.2, "r_x2": 136.996, "r_y2": 326.648, "r_x3": 50.112, "r_y3": 326.648, "coord_origin": "TOPLEFT"}, "text": "one creates an initial", "orig": "one creates an initial", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 48, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 141.051, "r_y0": 335.2, "r_x1": 166.226, "r_y1": 335.2, "r_x2": 166.226, "r_y2": 326.648, "r_x3": 141.051, "r_y3": 326.648, "coord_origin": "TOPLEFT"}, "text": "graph,", "orig": "graph,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 49, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 170.679, "r_y0": 335.2, "r_x1": 286.365, "r_y1": 335.2, "r_x2": 286.365, "r_y2": 326.648, "r_x3": 170.679, "r_y3": 326.648, "coord_origin": "TOPLEFT"}, "text": "where each of the text-cells", "orig": "where each of the text-cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 50, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 347.155, "r_x1": 260.442, "r_y1": 347.155, "r_x2": 260.442, "r_y2": 338.603, "r_x3": 50.112, "r_y3": 338.603, "coord_origin": "TOPLEFT"}, "text": "becomes a node in the graph similar to [33, 34, 2].", "orig": "becomes a node in the graph similar to [33, 34, 2].", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 51, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 266.45, "r_y0": 347.155, "r_x1": 286.365, "r_y1": 347.155, "r_x2": 286.365, "r_y2": 338.603, "r_x3": 266.45, "r_y3": 338.603, "coord_origin": "TOPLEFT"}, "text": "Each", "orig": "Each", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 52, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 359.11, "r_x1": 286.365, "r_y1": 359.11, "r_x2": 286.365, "r_y2": 350.558, "r_x3": 50.112, "r_y3": 350.558, "coord_origin": "TOPLEFT"}, "text": "node is then associated with en embedding vector coming", "orig": "node is then associated with en embedding vector coming", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 53, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 371.066, "r_x1": 286.365, "r_y1": 371.066, "r_x2": 286.365, "r_y2": 362.514, "r_x3": 50.112, "r_y3": 362.514, "coord_origin": "TOPLEFT"}, "text": "from the encoded image, its coordinates and the encoded", "orig": "from the encoded image, its coordinates and the encoded", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 54, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 383.021, "r_x1": 67.397, "r_y1": 383.021, "r_x2": 67.397, "r_y2": 374.469, "r_x3": 50.112, "r_y3": 374.469, "coord_origin": "TOPLEFT"}, "text": "text.", "orig": "text.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 55, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 72.976, "r_y0": 383.021, "r_x1": 286.365, "r_y1": 383.021, "r_x2": 286.365, "r_y2": 374.469, "r_x3": 72.976, "r_y3": 374.469, "coord_origin": "TOPLEFT"}, "text": "Furthermore, nodes that represent adjacent text-cells", "orig": "Furthermore, nodes that represent adjacent text-cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 56, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 394.976, "r_x1": 92.602, "r_y1": 394.976, "r_x2": 92.602, "r_y2": 386.424, "r_x3": 50.112, "r_y3": 386.424, "coord_origin": "TOPLEFT"}, "text": "are linked.", "orig": "are linked.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 57, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 97.305, "r_y0": 394.976, "r_x1": 286.365, "r_y1": 394.976, "r_x2": 286.365, "r_y2": 386.424, "r_x3": 97.305, "r_y3": 386.424, "coord_origin": "TOPLEFT"}, "text": "Graph Convolutional Networks (GCN's) based", "orig": "Graph Convolutional Networks (GCN's) based", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 58, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 406.931, "r_x1": 286.365, "r_y1": 406.931, "r_x2": 286.365, "r_y2": 398.379, "r_x3": 50.112, "r_y3": 398.379, "coord_origin": "TOPLEFT"}, "text": "methods take the image as an input, but also the position of", "orig": "methods take the image as an input, but also the position of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 59, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 418.886, "r_x1": 286.365, "r_y1": 418.886, "r_x2": 286.365, "r_y2": 410.334, "r_x3": 50.112, "r_y3": 410.334, "coord_origin": "TOPLEFT"}, "text": "the text-cells and their content [18]. The purpose of a GCN", "orig": "the text-cells and their content [18]. The purpose of a GCN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 60, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 430.841, "r_x1": 286.365, "r_y1": 430.841, "r_x2": 286.365, "r_y2": 422.289, "r_x3": 50.112, "r_y3": 422.289, "coord_origin": "TOPLEFT"}, "text": "is to transform the input graph into a new graph, which re-", "orig": "is to transform the input graph into a new graph, which re-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 61, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 442.797, "r_x1": 198.236, "r_y1": 442.797, "r_x2": 198.236, "r_y2": 434.245, "r_x3": 50.112, "r_y3": 434.245, "coord_origin": "TOPLEFT"}, "text": "places the old links with new ones.", "orig": "places the old links with new ones.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 62, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 205.927, "r_y0": 442.797, "r_x1": 286.365, "r_y1": 442.797, "r_x2": 286.365, "r_y2": 434.245, "r_x3": 205.927, "r_y3": 434.245, "coord_origin": "TOPLEFT"}, "text": "The new links then", "orig": "The new links then", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 63, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 454.752, "r_x1": 165.618, "r_y1": 454.752, "r_x2": 165.618, "r_y2": 446.2, "r_x3": 50.112, "r_y3": 446.2, "coord_origin": "TOPLEFT"}, "text": "represent the table-structure.", "orig": "represent the table-structure.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 64, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 171.417, "r_y0": 454.752, "r_x1": 286.365, "r_y1": 454.752, "r_x2": 286.365, "r_y2": 446.2, "r_x3": 171.417, "r_y3": 446.2, "coord_origin": "TOPLEFT"}, "text": "With this approach, one can", "orig": "With this approach, one can", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 65, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 466.707, "r_x1": 242.36, "r_y1": 466.707, "r_x2": 242.36, "r_y2": 458.155, "r_x3": 50.112, "r_y3": 458.155, "coord_origin": "TOPLEFT"}, "text": "avoid the need to build custom OCR decoders.", "orig": "avoid the need to build custom OCR decoders.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 66, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 248.408, "r_y0": 466.707, "r_x1": 286.365, "r_y1": 466.707, "r_x2": 286.365, "r_y2": 458.155, "r_x3": 248.408, "r_y3": 458.155, "coord_origin": "TOPLEFT"}, "text": "However,", "orig": "However,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 67, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 478.662, "r_x1": 286.365, "r_y1": 478.662, "r_x2": 286.365, "r_y2": 470.11, "r_x3": 50.112, "r_y3": 470.11, "coord_origin": "TOPLEFT"}, "text": "the quality of the reconstructed structure is not comparable", "orig": "the quality of the reconstructed structure is not comparable", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 68, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 490.617, "r_x1": 186.5, "r_y1": 490.617, "r_x2": 186.5, "r_y2": 482.065, "r_x3": 50.112, "r_y3": 482.065, "coord_origin": "TOPLEFT"}, "text": "to the current state-of-the-art [18].", "orig": "to the current state-of-the-art [18].", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Graph Neural networks : Graph Neural networks (GNN's) take a radically different approach to tablestructure extraction. Note that one table cell can constitute out of multiple text-cells. To obtain the table-structure, one creates an initial graph, where each of the text-cells becomes a node in the graph similar to [33, 34, 2]. Each node is then associated with en embedding vector coming from the encoded image, its coordinates and the encoded text. Furthermore, nodes that represent adjacent text-cells are linked. Graph Convolutional Networks (GCN's) based methods take the image as an input, but also the position of the text-cells and their content [18]. The purpose of a GCN is to transform the input graph into a new graph, which replaces the old links with new ones. The new links then represent the table-structure. With this approach, one can avoid the need to build custom OCR decoders. However, the quality of the reconstructed structure is not comparable to the current state-of-the-art [18]."}, {"label": "text", "id": 1, "page_no": 2, "cluster": {"id": 1, "label": "text", "bbox": {"l": 50.112, "t": 493.689, "r": 286.366, "b": 622.181, "coord_origin": "TOPLEFT"}, "confidence": 0.9875094294548035, "cells": [{"index": 69, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 502.645, "r_x1": 252.881, "r_y1": 502.645, "r_x2": 252.881, "r_y2": 493.689, "r_x3": 62.067, "r_y3": 493.689, "coord_origin": "TOPLEFT"}, "text": "Hybrid Deep Learning-Rule-Based approach", "orig": "Hybrid Deep Learning-Rule-Based approach", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 70, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 252.882, "r_y0": 502.629, "r_x1": 255.652, "r_y1": 502.629, "r_x2": 255.652, "r_y2": 494.077, "r_x3": 252.882, "r_y3": 494.077, "coord_origin": "TOPLEFT"}, "text": ":", "orig": ":", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 71, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 258.63, "r_y0": 502.629, "r_x1": 286.366, "r_y1": 502.629, "r_x2": 286.366, "r_y2": 494.077, "r_x3": 258.63, "r_y3": 494.077, "coord_origin": "TOPLEFT"}, "text": "Apop-", "orig": "Apop-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 72, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 514.5840000000001, "r_x1": 286.365, "r_y1": 514.5840000000001, "r_x2": 286.365, "r_y2": 506.032, "r_x3": 50.112, "r_y3": 506.032, "coord_origin": "TOPLEFT"}, "text": "ular current model for table-structure identification is the", "orig": "ular current model for table-structure identification is the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 73, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 526.539, "r_x1": 286.365, "r_y1": 526.539, "r_x2": 286.365, "r_y2": 517.9870000000001, "r_x3": 50.112, "r_y3": 517.9870000000001, "coord_origin": "TOPLEFT"}, "text": "use of a hybrid Deep Learning-Rule-Based approach similar", "orig": "use of a hybrid Deep Learning-Rule-Based approach similar", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 74, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 538.494, "r_x1": 286.365, "r_y1": 538.494, "r_x2": 286.365, "r_y2": 529.942, "r_x3": 50.112, "r_y3": 529.942, "coord_origin": "TOPLEFT"}, "text": "to [27, 29]. In this approach, one first detects the position of", "orig": "to [27, 29]. In this approach, one first detects the position of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 75, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 550.45, "r_x1": 286.365, "r_y1": 550.45, "r_x2": 286.365, "r_y2": 541.898, "r_x3": 50.112, "r_y3": 541.898, "coord_origin": "TOPLEFT"}, "text": "the table-cells with object detection (e.g. YoloVx or Mask-", "orig": "the table-cells with object detection (e.g. YoloVx or Mask-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 76, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 562.405, "r_x1": 286.365, "r_y1": 562.405, "r_x2": 286.365, "r_y2": 553.8530000000001, "r_x3": 50.112, "r_y3": 553.8530000000001, "coord_origin": "TOPLEFT"}, "text": "RCNN), then classifies the table into different types (from", "orig": "RCNN), then classifies the table into different types (from", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 77, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 574.36, "r_x1": 59.527, "r_y1": 574.36, "r_x2": 59.527, "r_y2": 565.808, "r_x3": 50.112, "r_y3": 565.808, "coord_origin": "TOPLEFT"}, "text": "its", "orig": "its", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 78, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 64.259, "r_y0": 574.36, "r_x1": 95.8, "r_y1": 574.36, "r_x2": 95.8, "r_y2": 565.808, "r_x3": 64.259, "r_y3": 565.808, "coord_origin": "TOPLEFT"}, "text": "images)", "orig": "images)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 79, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 100.523, "r_y0": 574.36, "r_x1": 145.105, "r_y1": 574.36, "r_x2": 145.105, "r_y2": 565.808, "r_x3": 100.523, "r_y3": 565.808, "coord_origin": "TOPLEFT"}, "text": "and finally", "orig": "and finally", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 80, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 149.828, "r_y0": 574.36, "r_x1": 166.983, "r_y1": 574.36, "r_x2": 166.983, "r_y2": 565.808, "r_x3": 149.828, "r_y3": 565.808, "coord_origin": "TOPLEFT"}, "text": "uses", "orig": "uses", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 81, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 171.715, "r_y0": 574.36, "r_x1": 205.768, "r_y1": 574.36, "r_x2": 205.768, "r_y2": 565.808, "r_x3": 171.715, "r_y3": 565.808, "coord_origin": "TOPLEFT"}, "text": "different", "orig": "different", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 82, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 210.5, "r_y0": 574.36, "r_x1": 244.243, "r_y1": 574.36, "r_x2": 244.243, "r_y2": 565.808, "r_x3": 210.5, "r_y3": 565.808, "coord_origin": "TOPLEFT"}, "text": "rule-sets", "orig": "rule-sets", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 83, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 248.975, "r_y0": 574.36, "r_x1": 256.726, "r_y1": 574.36, "r_x2": 256.726, "r_y2": 565.808, "r_x3": 248.975, "r_y3": 565.808, "coord_origin": "TOPLEFT"}, "text": "to", "orig": "to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 84, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 261.459, "r_y0": 574.36, "r_x1": 286.365, "r_y1": 574.36, "r_x2": 286.365, "r_y2": 565.808, "r_x3": 261.459, "r_y3": 565.808, "coord_origin": "TOPLEFT"}, "text": "obtain", "orig": "obtain", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 85, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 586.315, "r_x1": 122.64, "r_y1": 586.315, "r_x2": 122.64, "r_y2": 577.763, "r_x3": 50.112, "r_y3": 577.763, "coord_origin": "TOPLEFT"}, "text": "its table-structure.", "orig": "its table-structure.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 86, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 127.482, "r_y0": 586.315, "r_x1": 286.365, "r_y1": 586.315, "r_x2": 286.365, "r_y2": 577.763, "r_x3": 127.482, "r_y3": 577.763, "coord_origin": "TOPLEFT"}, "text": "Currently, this approach achieves state-", "orig": "Currently, this approach achieves state-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 87, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 598.27, "r_x1": 87.731, "r_y1": 598.27, "r_x2": 87.731, "r_y2": 589.718, "r_x3": 50.112, "r_y3": 589.718, "coord_origin": "TOPLEFT"}, "text": "of-the-art", "orig": "of-the-art", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 88, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 92.074, "r_y0": 598.27, "r_x1": 120.577, "r_y1": 598.27, "r_x2": 120.577, "r_y2": 589.718, "r_x3": 92.074, "r_y3": 589.718, "coord_origin": "TOPLEFT"}, "text": "results,", "orig": "results,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 89, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 125.389, "r_y0": 598.27, "r_x1": 137.922, "r_y1": 598.27, "r_x2": 137.922, "r_y2": 589.718, "r_x3": 125.389, "r_y3": 589.718, "coord_origin": "TOPLEFT"}, "text": "but", "orig": "but", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 90, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 142.266, "r_y0": 598.27, "r_x1": 148.911, "r_y1": 598.27, "r_x2": 148.911, "r_y2": 589.718, "r_x3": 142.266, "r_y3": 589.718, "coord_origin": "TOPLEFT"}, "text": "is", "orig": "is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 91, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 153.255, "r_y0": 598.27, "r_x1": 165.987, "r_y1": 598.27, "r_x2": 165.987, "r_y2": 589.718, "r_x3": 153.255, "r_y3": 589.718, "coord_origin": "TOPLEFT"}, "text": "not", "orig": "not", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 92, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 170.331, "r_y0": 598.27, "r_x1": 286.365, "r_y1": 598.27, "r_x2": 286.365, "r_y2": 589.718, "r_x3": 170.331, "r_y3": 589.718, "coord_origin": "TOPLEFT"}, "text": "an end-to-end deep-learning", "orig": "an end-to-end deep-learning", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 93, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 610.225, "r_x1": 82.49, "r_y1": 610.225, "r_x2": 82.49, "r_y2": 601.673, "r_x3": 50.112, "r_y3": 601.673, "coord_origin": "TOPLEFT"}, "text": "method.", "orig": "method.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 94, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 87.173, "r_y0": 610.225, "r_x1": 286.365, "r_y1": 610.225, "r_x2": 286.365, "r_y2": 601.673, "r_x3": 87.173, "r_y3": 601.673, "coord_origin": "TOPLEFT"}, "text": "As such, new rules need to be written if different", "orig": "As such, new rules need to be written if different", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 95, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 622.181, "r_x1": 175.989, "r_y1": 622.181, "r_x2": 175.989, "r_y2": 613.629, "r_x3": 50.112, "r_y3": 613.629, "coord_origin": "TOPLEFT"}, "text": "types of tables are encountered.", "orig": "types of tables are encountered.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Hybrid Deep Learning-Rule-Based approach : Apopular current model for table-structure identification is the use of a hybrid Deep Learning-Rule-Based approach similar to [27, 29]. In this approach, one first detects the position of the table-cells with object detection (e.g. YoloVx or MaskRCNN), then classifies the table into different types (from its images) and finally uses different rule-sets to obtain its table-structure. Currently, this approach achieves stateof-the-art results, but is not an end-to-end deep-learning method. As such, new rules need to be written if different types of tables are encountered."}, {"label": "section_header", "id": 8, "page_no": 2, "cluster": {"id": 8, "label": "section_header", "bbox": {"l": 50.112, "t": 635.9449999999999, "r": 105.225, "b": 646.693, "coord_origin": "TOPLEFT"}, "confidence": 0.9423062205314636, "cells": [{"index": 96, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 646.693, "r_x1": 105.225, "r_y1": 646.693, "r_x2": 105.225, "r_y2": 635.9449999999999, "r_x3": 50.112, "r_y3": 635.9449999999999, "coord_origin": "TOPLEFT"}, "text": "3. Datasets", "orig": "3. Datasets", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "3. Datasets"}, {"label": "text", "id": 3, "page_no": 2, "cluster": {"id": 3, "label": "text", "bbox": {"l": 50.112, "t": 656.694, "r": 286.365, "b": 713.066, "coord_origin": "TOPLEFT"}, "confidence": 0.9862047433853149, "cells": [{"index": 97, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 665.246, "r_x1": 286.365, "r_y1": 665.246, "r_x2": 286.365, "r_y2": 656.694, "r_x3": 62.067, "r_y3": 656.694, "coord_origin": "TOPLEFT"}, "text": "We rely on large-scale datasets such as PubTabNet [37],", "orig": "We rely on large-scale datasets such as PubTabNet [37],", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 98, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 677.201, "r_x1": 286.365, "r_y1": 677.201, "r_x2": 286.365, "r_y2": 668.649, "r_x3": 50.112, "r_y3": 668.649, "coord_origin": "TOPLEFT"}, "text": "FinTabNet [36], and TableBank [17] datasets to train and", "orig": "FinTabNet [36], and TableBank [17] datasets to train and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 99, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 689.156, "r_x1": 133.479, "r_y1": 689.156, "r_x2": 133.479, "r_y2": 680.604, "r_x3": 50.112, "r_y3": 680.604, "coord_origin": "TOPLEFT"}, "text": "evaluate our models.", "orig": "evaluate our models.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 100, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 138.271, "r_y0": 689.156, "r_x1": 286.365, "r_y1": 689.156, "r_x2": 286.365, "r_y2": 680.604, "r_x3": 138.271, "r_y3": 680.604, "coord_origin": "TOPLEFT"}, "text": "These datasets span over various ap-", "orig": "These datasets span over various ap-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 101, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 701.111, "r_x1": 166.246, "r_y1": 701.111, "r_x2": 166.246, "r_y2": 692.559, "r_x3": 50.112, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "pearance styles and content.", "orig": "pearance styles and content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 102, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 173.688, "r_y0": 701.111, "r_x1": 286.365, "r_y1": 701.111, "r_x2": 286.365, "r_y2": 692.559, "r_x3": 173.688, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "We also introduce our own", "orig": "We also introduce our own", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 103, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 713.066, "r_x1": 286.365, "r_y1": 713.066, "r_x2": 286.365, "r_y2": 704.514, "r_x3": 50.112, "r_y3": 704.514, "coord_origin": "TOPLEFT"}, "text": "synthetically generated SynthTabNet dataset to fix an im-", "orig": "synthetically generated SynthTabNet dataset to fix an im-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "We rely on large-scale datasets such as PubTabNet [37], FinTabNet [36], and TableBank [17] datasets to train and evaluate our models. These datasets span over various appearance styles and content. We also introduce our own synthetically generated SynthTabNet dataset to fix an im-"}, {"label": "picture", "id": 6, "page_no": 2, "cluster": {"id": 6, "label": "picture", "bbox": {"l": 312.10369873046875, "t": 78.44086456298828, "r": 550.38916015625, "b": 250.60984802246094, "coord_origin": "TOPLEFT"}, "confidence": 0.9746918082237244, "cells": [{"index": 104, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 380.799, "r_y0": 88.46699999999998, "r_x1": 486.849, "r_y1": 88.46699999999998, "r_x2": 486.849, "r_y2": 80.154, "r_x3": 380.799, "r_y3": 80.154, "coord_origin": "TOPLEFT"}, "text": "PubTabNet + FinTabNet", "orig": "PubTabNet + FinTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 105, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 396.768, "r_y0": 250.68200000000002, "r_x1": 469.787, "r_y1": 250.68200000000002, "r_x2": 469.787, "r_y2": 242.36900000000003, "r_x3": 396.768, "r_y3": 242.36900000000003, "coord_origin": "TOPLEFT"}, "text": "Rows / Columns", "orig": "Rows / Columns", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 106, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.977, "r_y0": 239.19299999999998, "r_x1": 324.793, "r_y1": 239.19299999999998, "r_x2": 324.793, "r_y2": 233.65099999999995, "r_x3": 320.977, "r_y3": 233.65099999999995, "coord_origin": "TOPLEFT"}, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 107, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 410.483, "r_y0": 239.19299999999998, "r_x1": 418.113, "r_y1": 239.19299999999998, "r_x2": 418.113, "r_y2": 233.65099999999995, "r_x3": 410.483, "r_y3": 233.65099999999995, "coord_origin": "TOPLEFT"}, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 108, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 500.85, "r_y0": 239.19299999999998, "r_x1": 508.48, "r_y1": 239.19299999999998, "r_x2": 508.48, "r_y2": 233.65099999999995, "r_x3": 500.85, "r_y3": 233.65099999999995, "coord_origin": "TOPLEFT"}, "text": "40", "orig": "40", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 109, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 365.3, "r_y0": 239.19299999999998, "r_x1": 372.93, "r_y1": 239.19299999999998, "r_x2": 372.93, "r_y2": 233.65099999999995, "r_x3": 365.3, "r_y3": 233.65099999999995, "coord_origin": "TOPLEFT"}, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 110, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 455.666, "r_y0": 239.19299999999998, "r_x1": 463.296, "r_y1": 239.19299999999998, "r_x2": 463.296, "r_y2": 233.65099999999995, "r_x3": 455.666, "r_y3": 233.65099999999995, "coord_origin": "TOPLEFT"}, "text": "30", "orig": "30", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 111, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 542.035, "r_y0": 239.19299999999998, "r_x1": 549.665, "r_y1": 239.19299999999998, "r_x2": 549.665, "r_y2": 233.65099999999995, "r_x3": 542.035, "r_y3": 233.65099999999995, "coord_origin": "TOPLEFT"}, "text": "50", "orig": "50", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 112, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 316.045, "r_y0": 236.21699999999998, "r_x1": 319.861, "r_y1": 236.21699999999998, "r_x2": 319.861, "r_y2": 230.67399999999998, "r_x3": 316.045, "r_y3": 230.67399999999998, "coord_origin": "TOPLEFT"}, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 113, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 312.625, "r_y0": 204.461, "r_x1": 320.255, "r_y1": 204.461, "r_x2": 320.255, "r_y2": 198.91899999999998, "r_x3": 312.625, "r_y3": 198.91899999999998, "coord_origin": "TOPLEFT"}, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 114, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 313.15, "r_y0": 173.86800000000005, "r_x1": 320.78, "r_y1": 173.86800000000005, "r_x2": 320.78, "r_y2": 168.32600000000002, "r_x3": 313.15, "r_y3": 168.32600000000002, "coord_origin": "TOPLEFT"}, "text": "40", "orig": "40", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 115, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 312.93, "r_y0": 142.35799999999995, "r_x1": 320.56, "r_y1": 142.35799999999995, "r_x2": 320.56, "r_y2": 136.81600000000003, "r_x3": 312.93, "r_y3": 136.81600000000003, "coord_origin": "TOPLEFT"}, "text": "60", "orig": "60", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 116, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 312.482, "r_y0": 111.37199999999996, "r_x1": 320.112, "r_y1": 111.37199999999996, "r_x2": 320.112, "r_y2": 105.83000000000004, "r_x3": 312.482, "r_y3": 105.83000000000004, "coord_origin": "TOPLEFT"}, "text": "80", "orig": "80", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 117, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 312.482, "r_y0": 218.02999999999997, "r_x1": 320.112, "r_y1": 218.02999999999997, "r_x2": 320.112, "r_y2": 212.48699999999997, "r_x3": 312.482, "r_y3": 212.48699999999997, "coord_origin": "TOPLEFT"}, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 118, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 313.076, "r_y0": 189.49199999999996, "r_x1": 320.707, "r_y1": 189.49199999999996, "r_x2": 320.707, "r_y2": 183.95000000000005, "r_x3": 313.076, "r_y3": 183.95000000000005, "coord_origin": "TOPLEFT"}, "text": "30", "orig": "30", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 119, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 312.763, "r_y0": 158.24400000000003, "r_x1": 320.393, "r_y1": 158.24400000000003, "r_x2": 320.393, "r_y2": 152.702, "r_x3": 312.763, "r_y3": 152.702, "coord_origin": "TOPLEFT"}, "text": "50", "orig": "50", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 120, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 312.198, "r_y0": 126.34100000000001, "r_x1": 319.828, "r_y1": 126.34100000000001, "r_x2": 319.828, "r_y2": 120.798, "r_x3": 312.198, "r_y3": 120.798, "coord_origin": "TOPLEFT"}, "text": "70", "orig": "70", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 121, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 312.817, "r_y0": 95.87900000000002, "r_x1": 320.447, "r_y1": 95.87900000000002, "r_x2": 320.447, "r_y2": 90.33699999999999, "r_x3": 312.817, "r_y3": 90.33699999999999, "coord_origin": "TOPLEFT"}, "text": "90", "orig": "90", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 122, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 532.174, "r_y0": 229.94000000000005, "r_x1": 536.944, "r_y1": 229.94000000000005, "r_x2": 536.944, "r_y2": 223.01199999999994, "r_x3": 532.174, "r_y3": 223.01199999999994, "coord_origin": "TOPLEFT"}, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 123, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 532.88, "r_y0": 115.48000000000002, "r_x1": 547.613, "r_y1": 115.48000000000002, "r_x2": 547.613, "r_y2": 108.55200000000002, "r_x3": 532.88, "r_y3": 108.55200000000002, "coord_origin": "TOPLEFT"}, "text": "10K", "orig": "10K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 124, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 532.774, "r_y0": 137.99400000000003, "r_x1": 542.739, "r_y1": 137.99400000000003, "r_x2": 542.739, "r_y2": 131.06600000000003, "r_x3": 532.774, "r_y3": 131.06600000000003, "coord_origin": "TOPLEFT"}, "text": "8K", "orig": "8K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 125, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 532.799, "r_y0": 161.13599999999997, "r_x1": 542.764, "r_y1": 161.13599999999997, "r_x2": 542.764, "r_y2": 154.20799999999997, "r_x3": 532.799, "r_y3": 154.20799999999997, "coord_origin": "TOPLEFT"}, "text": "6K", "orig": "6K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 126, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 532.571, "r_y0": 183.971, "r_x1": 542.536, "r_y1": 183.971, "r_x2": 542.536, "r_y2": 177.043, "r_x3": 532.571, "r_y3": 177.043, "coord_origin": "TOPLEFT"}, "text": "4K", "orig": "4K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 127, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 532.146, "r_y0": 206.85900000000004, "r_x1": 542.111, "r_y1": 206.85900000000004, "r_x2": 542.111, "r_y2": 199.93100000000004, "r_x3": 532.146, "r_y3": 199.93100000000004, "coord_origin": "TOPLEFT"}, "text": "2K", "orig": "2K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": [{"id": 12, "label": "section_header", "bbox": {"l": 380.799, "t": 80.154, "r": 486.849, "b": 88.46699999999998, "coord_origin": "TOPLEFT"}, "confidence": 0.5687217116355896, "cells": [{"index": 104, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 380.799, "r_y0": 88.46699999999998, "r_x1": 486.849, "r_y1": 88.46699999999998, "r_x2": 486.849, "r_y2": 80.154, "r_x3": 380.799, "r_y3": 80.154, "coord_origin": "TOPLEFT"}, "text": "PubTabNet + FinTabNet", "orig": "PubTabNet + FinTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 16, "label": "text", "bbox": {"l": 396.768, "t": 242.36900000000003, "r": 469.787, "b": 250.68200000000002, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 105, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 396.768, "r_y0": 250.68200000000002, "r_x1": 469.787, "r_y1": 250.68200000000002, "r_x2": 469.787, "r_y2": 242.36900000000003, "r_x3": 396.768, "r_y3": 242.36900000000003, "coord_origin": "TOPLEFT"}, "text": "Rows / Columns", "orig": "Rows / Columns", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 17, "label": "text", "bbox": {"l": 320.977, "t": 233.65099999999995, "r": 324.793, "b": 239.19299999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 106, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.977, "r_y0": 239.19299999999998, "r_x1": 324.793, "r_y1": 239.19299999999998, "r_x2": 324.793, "r_y2": 233.65099999999995, "r_x3": 320.977, "r_y3": 233.65099999999995, "coord_origin": "TOPLEFT"}, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 18, "label": "text", "bbox": {"l": 410.483, "t": 233.65099999999995, "r": 418.113, "b": 239.19299999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 107, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 410.483, "r_y0": 239.19299999999998, "r_x1": 418.113, "r_y1": 239.19299999999998, "r_x2": 418.113, "r_y2": 233.65099999999995, "r_x3": 410.483, "r_y3": 233.65099999999995, "coord_origin": "TOPLEFT"}, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 19, "label": "text", "bbox": {"l": 500.85, "t": 233.65099999999995, "r": 508.48, "b": 239.19299999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 108, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 500.85, "r_y0": 239.19299999999998, "r_x1": 508.48, "r_y1": 239.19299999999998, "r_x2": 508.48, "r_y2": 233.65099999999995, "r_x3": 500.85, "r_y3": 233.65099999999995, "coord_origin": "TOPLEFT"}, "text": "40", "orig": "40", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 20, "label": "text", "bbox": {"l": 365.3, "t": 233.65099999999995, "r": 372.93, "b": 239.19299999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 109, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 365.3, "r_y0": 239.19299999999998, "r_x1": 372.93, "r_y1": 239.19299999999998, "r_x2": 372.93, "r_y2": 233.65099999999995, "r_x3": 365.3, "r_y3": 233.65099999999995, "coord_origin": "TOPLEFT"}, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 21, "label": "text", "bbox": {"l": 455.666, "t": 233.65099999999995, "r": 463.296, "b": 239.19299999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 110, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 455.666, "r_y0": 239.19299999999998, "r_x1": 463.296, "r_y1": 239.19299999999998, "r_x2": 463.296, "r_y2": 233.65099999999995, "r_x3": 455.666, "r_y3": 233.65099999999995, "coord_origin": "TOPLEFT"}, "text": "30", "orig": "30", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 22, "label": "text", "bbox": {"l": 542.035, "t": 233.65099999999995, "r": 549.665, "b": 239.19299999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 111, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 542.035, "r_y0": 239.19299999999998, "r_x1": 549.665, "r_y1": 239.19299999999998, "r_x2": 549.665, "r_y2": 233.65099999999995, "r_x3": 542.035, "r_y3": 233.65099999999995, "coord_origin": "TOPLEFT"}, "text": "50", "orig": "50", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 23, "label": "text", "bbox": {"l": 316.045, "t": 230.67399999999998, "r": 319.861, "b": 236.21699999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 112, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 316.045, "r_y0": 236.21699999999998, "r_x1": 319.861, "r_y1": 236.21699999999998, "r_x2": 319.861, "r_y2": 230.67399999999998, "r_x3": 316.045, "r_y3": 230.67399999999998, "coord_origin": "TOPLEFT"}, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 24, "label": "text", "bbox": {"l": 312.625, "t": 198.91899999999998, "r": 320.255, "b": 204.461, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 113, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 312.625, "r_y0": 204.461, "r_x1": 320.255, "r_y1": 204.461, "r_x2": 320.255, "r_y2": 198.91899999999998, "r_x3": 312.625, "r_y3": 198.91899999999998, "coord_origin": "TOPLEFT"}, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 25, "label": "text", "bbox": {"l": 313.15, "t": 168.32600000000002, "r": 320.78, "b": 173.86800000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 114, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 313.15, "r_y0": 173.86800000000005, "r_x1": 320.78, "r_y1": 173.86800000000005, "r_x2": 320.78, "r_y2": 168.32600000000002, "r_x3": 313.15, "r_y3": 168.32600000000002, "coord_origin": "TOPLEFT"}, "text": "40", "orig": "40", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 26, "label": "text", "bbox": {"l": 312.93, "t": 136.81600000000003, "r": 320.56, "b": 142.35799999999995, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 115, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 312.93, "r_y0": 142.35799999999995, "r_x1": 320.56, "r_y1": 142.35799999999995, "r_x2": 320.56, "r_y2": 136.81600000000003, "r_x3": 312.93, "r_y3": 136.81600000000003, "coord_origin": "TOPLEFT"}, "text": "60", "orig": "60", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 27, "label": "text", "bbox": {"l": 312.482, "t": 105.83000000000004, "r": 320.112, "b": 111.37199999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 116, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 312.482, "r_y0": 111.37199999999996, "r_x1": 320.112, "r_y1": 111.37199999999996, "r_x2": 320.112, "r_y2": 105.83000000000004, "r_x3": 312.482, "r_y3": 105.83000000000004, "coord_origin": "TOPLEFT"}, "text": "80", "orig": "80", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 28, "label": "text", "bbox": {"l": 312.482, "t": 212.48699999999997, "r": 320.112, "b": 218.02999999999997, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 117, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 312.482, "r_y0": 218.02999999999997, "r_x1": 320.112, "r_y1": 218.02999999999997, "r_x2": 320.112, "r_y2": 212.48699999999997, "r_x3": 312.482, "r_y3": 212.48699999999997, "coord_origin": "TOPLEFT"}, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 29, "label": "text", "bbox": {"l": 313.076, "t": 183.95000000000005, "r": 320.707, "b": 189.49199999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 118, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 313.076, "r_y0": 189.49199999999996, "r_x1": 320.707, "r_y1": 189.49199999999996, "r_x2": 320.707, "r_y2": 183.95000000000005, "r_x3": 313.076, "r_y3": 183.95000000000005, "coord_origin": "TOPLEFT"}, "text": "30", "orig": "30", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 30, "label": "text", "bbox": {"l": 312.763, "t": 152.702, "r": 320.393, "b": 158.24400000000003, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 119, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 312.763, "r_y0": 158.24400000000003, "r_x1": 320.393, "r_y1": 158.24400000000003, "r_x2": 320.393, "r_y2": 152.702, "r_x3": 312.763, "r_y3": 152.702, "coord_origin": "TOPLEFT"}, "text": "50", "orig": "50", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 31, "label": "text", "bbox": {"l": 312.198, "t": 120.798, "r": 319.828, "b": 126.34100000000001, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 120, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 312.198, "r_y0": 126.34100000000001, "r_x1": 319.828, "r_y1": 126.34100000000001, "r_x2": 319.828, "r_y2": 120.798, "r_x3": 312.198, "r_y3": 120.798, "coord_origin": "TOPLEFT"}, "text": "70", "orig": "70", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 32, "label": "text", "bbox": {"l": 312.817, "t": 90.33699999999999, "r": 320.447, "b": 95.87900000000002, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 121, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 312.817, "r_y0": 95.87900000000002, "r_x1": 320.447, "r_y1": 95.87900000000002, "r_x2": 320.447, "r_y2": 90.33699999999999, "r_x3": 312.817, "r_y3": 90.33699999999999, "coord_origin": "TOPLEFT"}, "text": "90", "orig": "90", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 33, "label": "text", "bbox": {"l": 532.174, "t": 223.01199999999994, "r": 536.944, "b": 229.94000000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 122, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 532.174, "r_y0": 229.94000000000005, "r_x1": 536.944, "r_y1": 229.94000000000005, "r_x2": 536.944, "r_y2": 223.01199999999994, "r_x3": 532.174, "r_y3": 223.01199999999994, "coord_origin": "TOPLEFT"}, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 34, "label": "text", "bbox": {"l": 532.88, "t": 108.55200000000002, "r": 547.613, "b": 115.48000000000002, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 123, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 532.88, "r_y0": 115.48000000000002, "r_x1": 547.613, "r_y1": 115.48000000000002, "r_x2": 547.613, "r_y2": 108.55200000000002, "r_x3": 532.88, "r_y3": 108.55200000000002, "coord_origin": "TOPLEFT"}, "text": "10K", "orig": "10K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 35, "label": "text", "bbox": {"l": 532.774, "t": 131.06600000000003, "r": 542.739, "b": 137.99400000000003, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 124, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 532.774, "r_y0": 137.99400000000003, "r_x1": 542.739, "r_y1": 137.99400000000003, "r_x2": 542.739, "r_y2": 131.06600000000003, "r_x3": 532.774, "r_y3": 131.06600000000003, "coord_origin": "TOPLEFT"}, "text": "8K", "orig": "8K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 36, "label": "text", "bbox": {"l": 532.799, "t": 154.20799999999997, "r": 542.764, "b": 161.13599999999997, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 125, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 532.799, "r_y0": 161.13599999999997, "r_x1": 542.764, "r_y1": 161.13599999999997, "r_x2": 542.764, "r_y2": 154.20799999999997, "r_x3": 532.799, "r_y3": 154.20799999999997, "coord_origin": "TOPLEFT"}, "text": "6K", "orig": "6K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 37, "label": "text", "bbox": {"l": 532.571, "t": 177.043, "r": 542.536, "b": 183.971, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 126, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 532.571, "r_y0": 183.971, "r_x1": 542.536, "r_y1": 183.971, "r_x2": 542.536, "r_y2": 177.043, "r_x3": 532.571, "r_y3": 177.043, "coord_origin": "TOPLEFT"}, "text": "4K", "orig": "4K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 38, "label": "text", "bbox": {"l": 532.146, "t": 199.93100000000004, "r": 542.111, "b": 206.85900000000004, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 127, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 532.146, "r_y0": 206.85900000000004, "r_x1": 542.111, "r_y1": 206.85900000000004, "r_x2": 542.111, "r_y2": 199.93100000000004, "r_x3": 532.146, "r_y3": 199.93100000000004, "coord_origin": "TOPLEFT"}, "text": "2K", "orig": "2K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}]}, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null}, {"label": "caption", "id": 7, "page_no": 2, "cluster": {"id": 7, "label": "caption", "bbox": {"l": 308.862, "t": 268.105, "r": 545.115, "b": 288.612, "coord_origin": "TOPLEFT"}, "confidence": 0.9667505025863647, "cells": [{"index": 128, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 276.65700000000004, "r_x1": 346.062, "r_y1": 276.65700000000004, "r_x2": 346.062, "r_y2": 268.105, "r_x3": 308.862, "r_y3": 268.105, "coord_origin": "TOPLEFT"}, "text": "Figure 2:", "orig": "Figure 2:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 129, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 354.491, "r_y0": 276.65700000000004, "r_x1": 545.115, "r_y1": 276.65700000000004, "r_x2": 545.115, "r_y2": 268.105, "r_x3": 354.491, "r_y3": 268.105, "coord_origin": "TOPLEFT"}, "text": "Distribution of the tables across different table", "orig": "Distribution of the tables across different table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 130, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 288.612, "r_x1": 498.57, "r_y1": 288.612, "r_x2": 498.57, "r_y2": 280.06, "r_x3": 308.862, "r_y3": 280.06, "coord_origin": "TOPLEFT"}, "text": "dimensions in PubTabNet + FinTabNet datasets", "orig": "dimensions in PubTabNet + FinTabNet datasets", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Figure 2: Distribution of the tables across different table dimensions in PubTabNet + FinTabNet datasets"}, {"label": "text", "id": 9, "page_no": 2, "cluster": {"id": 9, "label": "text", "bbox": {"l": 308.862, "t": 317.742, "r": 437.27, "b": 326.294, "coord_origin": "TOPLEFT"}, "confidence": 0.8879811763763428, "cells": [{"index": 131, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 326.294, "r_x1": 437.27, "r_y1": 326.294, "r_x2": 437.27, "r_y2": 317.742, "r_x3": 308.862, "r_y3": 317.742, "coord_origin": "TOPLEFT"}, "text": "balance in the previous datasets.", "orig": "balance in the previous datasets.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "balance in the previous datasets."}, {"label": "text", "id": 2, "page_no": 2, "cluster": {"id": 2, "label": "text", "bbox": {"l": 308.862, "t": 331.8, "r": 545.115, "b": 627.2760000000001, "coord_origin": "TOPLEFT"}, "confidence": 0.9870319366455078, "cells": [{"index": 132, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 340.352, "r_x1": 545.115, "r_y1": 340.352, "r_x2": 545.115, "r_y2": 331.8, "r_x3": 320.817, "r_y3": 331.8, "coord_origin": "TOPLEFT"}, "text": "The PubTabNet dataset contains 509k tables delivered as", "orig": "The PubTabNet dataset contains 509k tables delivered as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 133, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 352.307, "r_x1": 545.115, "r_y1": 352.307, "r_x2": 545.115, "r_y2": 343.755, "r_x3": 308.862, "r_y3": 343.755, "coord_origin": "TOPLEFT"}, "text": "annotated PNGimages. The annotations consist of the table", "orig": "annotated PNGimages. The annotations consist of the table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 134, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 364.263, "r_x1": 545.115, "r_y1": 364.263, "r_x2": 545.115, "r_y2": 355.711, "r_x3": 308.862, "r_y3": 355.711, "coord_origin": "TOPLEFT"}, "text": "structure represented in HTML format, the tokenized text", "orig": "structure represented in HTML format, the tokenized text", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 135, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 376.218, "r_x1": 545.115, "r_y1": 376.218, "r_x2": 545.115, "r_y2": 367.666, "r_x3": 308.862, "r_y3": 367.666, "coord_origin": "TOPLEFT"}, "text": "and its bounding boxes per table cell. Fig. 1 shows the ap-", "orig": "and its bounding boxes per table cell. Fig. 1 shows the ap-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 136, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 388.173, "r_x1": 545.115, "r_y1": 388.173, "r_x2": 545.115, "r_y2": 379.621, "r_x3": 308.862, "r_y3": 379.621, "coord_origin": "TOPLEFT"}, "text": "pearance style of PubTabNet. Depending on its complexity,", "orig": "pearance style of PubTabNet. Depending on its complexity,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 137, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 400.128, "r_x1": 545.115, "r_y1": 400.128, "r_x2": 545.115, "r_y2": 391.576, "r_x3": 308.862, "r_y3": 391.576, "coord_origin": "TOPLEFT"}, "text": "a table is characterized as 'simple' when it does not contain", "orig": "a table is characterized as 'simple' when it does not contain", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 138, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 412.083, "r_x1": 545.115, "r_y1": 412.083, "r_x2": 545.115, "r_y2": 403.531, "r_x3": 308.862, "r_y3": 403.531, "coord_origin": "TOPLEFT"}, "text": "row spans or column spans, otherwise it is 'complex'. The", "orig": "row spans or column spans, otherwise it is 'complex'. The", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 139, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 424.038, "r_x1": 545.115, "r_y1": 424.038, "r_x2": 545.115, "r_y2": 415.486, "r_x3": 308.862, "r_y3": 415.486, "coord_origin": "TOPLEFT"}, "text": "dataset is divided into Train and Val splits (roughly 98%and", "orig": "dataset is divided into Train and Val splits (roughly 98%and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 140, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 435.994, "r_x1": 545.115, "r_y1": 435.994, "r_x2": 545.115, "r_y2": 427.442, "r_x3": 308.862, "r_y3": 427.442, "coord_origin": "TOPLEFT"}, "text": "2%). The Train split consists of 54% simple and 46% com-", "orig": "2%). The Train split consists of 54% simple and 46% com-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 141, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 447.949, "r_x1": 545.115, "r_y1": 447.949, "r_x2": 545.115, "r_y2": 439.397, "r_x3": 308.862, "r_y3": 439.397, "coord_origin": "TOPLEFT"}, "text": "plex tables and the Val split of 51% and 49% respectively.", "orig": "plex tables and the Val split of 51% and 49% respectively.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 142, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 459.904, "r_x1": 545.115, "r_y1": 459.904, "r_x2": 545.115, "r_y2": 451.352, "r_x3": 308.862, "r_y3": 451.352, "coord_origin": "TOPLEFT"}, "text": "The FinTabNet dataset contains 112k tables delivered as", "orig": "The FinTabNet dataset contains 112k tables delivered as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 143, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 471.859, "r_x1": 545.115, "r_y1": 471.859, "r_x2": 545.115, "r_y2": 463.307, "r_x3": 308.862, "r_y3": 463.307, "coord_origin": "TOPLEFT"}, "text": "single-page PDFdocuments with mixed table structures and", "orig": "single-page PDFdocuments with mixed table structures and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 144, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 483.814, "r_x1": 358.984, "r_y1": 483.814, "r_x2": 358.984, "r_y2": 475.262, "r_x3": 308.862, "r_y3": 475.262, "coord_origin": "TOPLEFT"}, "text": "text content.", "orig": "text content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 145, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 365.121, "r_y0": 483.814, "r_x1": 545.115, "r_y1": 483.814, "r_x2": 545.115, "r_y2": 475.262, "r_x3": 365.121, "r_y3": 475.262, "coord_origin": "TOPLEFT"}, "text": "Similarly to the PubTabNet, the annotations", "orig": "Similarly to the PubTabNet, the annotations", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 146, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 495.77, "r_x1": 545.115, "r_y1": 495.77, "r_x2": 545.115, "r_y2": 487.218, "r_x3": 308.862, "r_y3": 487.218, "coord_origin": "TOPLEFT"}, "text": "of FinTabNet include the table structure in HTML, the to-", "orig": "of FinTabNet include the table structure in HTML, the to-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 147, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 507.725, "r_x1": 545.115, "r_y1": 507.725, "r_x2": 545.115, "r_y2": 499.173, "r_x3": 308.862, "r_y3": 499.173, "coord_origin": "TOPLEFT"}, "text": "kenized text and the bounding boxes on a table cell basis.", "orig": "kenized text and the bounding boxes on a table cell basis.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 148, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 519.6800000000001, "r_x1": 545.115, "r_y1": 519.6800000000001, "r_x2": 545.115, "r_y2": 511.128, "r_x3": 308.862, "r_y3": 511.128, "coord_origin": "TOPLEFT"}, "text": "The dataset is divided into Train, Test and Val splits (81%,", "orig": "The dataset is divided into Train, Test and Val splits (81%,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 149, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 531.635, "r_x1": 545.115, "r_y1": 531.635, "r_x2": 545.115, "r_y2": 523.0830000000001, "r_x3": 308.862, "r_y3": 523.0830000000001, "coord_origin": "TOPLEFT"}, "text": "9.5%, 9.5%), and each one is almost equally divided into", "orig": "9.5%, 9.5%), and each one is almost equally divided into", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 150, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 543.59, "r_x1": 545.115, "r_y1": 543.59, "r_x2": 545.115, "r_y2": 535.038, "r_x3": 308.862, "r_y3": 535.038, "coord_origin": "TOPLEFT"}, "text": "simple and complex tables (Train: 48% simple, 52% com-", "orig": "simple and complex tables (Train: 48% simple, 52% com-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 151, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 555.545, "r_x1": 350.964, "r_y1": 555.545, "r_x2": 350.964, "r_y2": 546.9929999999999, "r_x3": 308.862, "r_y3": 546.9929999999999, "coord_origin": "TOPLEFT"}, "text": "plex, Test:", "orig": "plex, Test:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 152, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 355.467, "r_y0": 555.545, "r_x1": 490.082, "r_y1": 555.545, "r_x2": 490.082, "r_y2": 546.9929999999999, "r_x3": 355.467, "r_y3": 546.9929999999999, "coord_origin": "TOPLEFT"}, "text": "48% simple, 52% complex, Test:", "orig": "48% simple, 52% complex, Test:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 153, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 494.595, "r_y0": 555.545, "r_x1": 545.115, "r_y1": 555.545, "r_x2": 545.115, "r_y2": 546.9929999999999, "r_x3": 494.595, "r_y3": 546.9929999999999, "coord_origin": "TOPLEFT"}, "text": "53% simple,", "orig": "53% simple,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 154, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 567.501, "r_x1": 370.6, "r_y1": 567.501, "r_x2": 370.6, "r_y2": 558.9490000000001, "r_x3": 308.862, "r_y3": 558.9490000000001, "coord_origin": "TOPLEFT"}, "text": "47% complex).", "orig": "47% complex).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 155, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 376.737, "r_y0": 567.501, "r_x1": 545.115, "r_y1": 567.501, "r_x2": 545.115, "r_y2": 558.9490000000001, "r_x3": 376.737, "r_y3": 558.9490000000001, "coord_origin": "TOPLEFT"}, "text": "Finally the TableBank dataset consists of", "orig": "Finally the TableBank dataset consists of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 156, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 579.456, "r_x1": 545.115, "r_y1": 579.456, "r_x2": 545.115, "r_y2": 570.904, "r_x3": 308.862, "r_y3": 570.904, "coord_origin": "TOPLEFT"}, "text": "145k tables provided as JPEG images. The latter has anno-", "orig": "145k tables provided as JPEG images. The latter has anno-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 157, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 591.4110000000001, "r_x1": 545.115, "r_y1": 591.4110000000001, "r_x2": 545.115, "r_y2": 582.859, "r_x3": 308.862, "r_y3": 582.859, "coord_origin": "TOPLEFT"}, "text": "tations for the table structure, but only few with bounding", "orig": "tations for the table structure, but only few with bounding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 158, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 603.366, "r_x1": 403.726, "r_y1": 603.366, "r_x2": 403.726, "r_y2": 594.814, "r_x3": 308.862, "r_y3": 594.814, "coord_origin": "TOPLEFT"}, "text": "boxes of the table cells.", "orig": "boxes of the table cells.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 159, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 407.731, "r_y0": 603.366, "r_x1": 545.115, "r_y1": 603.366, "r_x2": 545.115, "r_y2": 594.814, "r_x3": 407.731, "r_y3": 594.814, "coord_origin": "TOPLEFT"}, "text": "The entire dataset consists of sim-", "orig": "The entire dataset consists of sim-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 160, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 615.321, "r_x1": 545.115, "r_y1": 615.321, "r_x2": 545.115, "r_y2": 606.769, "r_x3": 308.862, "r_y3": 606.769, "coord_origin": "TOPLEFT"}, "text": "ple tables and it is divided into 90% Train, 3% Test and 7%", "orig": "ple tables and it is divided into 90% Train, 3% Test and 7%", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 161, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 627.2760000000001, "r_x1": 348.164, "r_y1": 627.2760000000001, "r_x2": 348.164, "r_y2": 618.7239999999999, "r_x3": 308.862, "r_y3": 618.7239999999999, "coord_origin": "TOPLEFT"}, "text": "Val splits.", "orig": "Val splits.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "The PubTabNet dataset contains 509k tables delivered as annotated PNGimages. The annotations consist of the table structure represented in HTML format, the tokenized text and its bounding boxes per table cell. Fig. 1 shows the appearance style of PubTabNet. Depending on its complexity, a table is characterized as 'simple' when it does not contain row spans or column spans, otherwise it is 'complex'. The dataset is divided into Train and Val splits (roughly 98%and 2%). The Train split consists of 54% simple and 46% complex tables and the Val split of 51% and 49% respectively. The FinTabNet dataset contains 112k tables delivered as single-page PDFdocuments with mixed table structures and text content. Similarly to the PubTabNet, the annotations of FinTabNet include the table structure in HTML, the tokenized text and the bounding boxes on a table cell basis. The dataset is divided into Train, Test and Val splits (81%, 9.5%, 9.5%), and each one is almost equally divided into simple and complex tables (Train: 48% simple, 52% complex, Test: 48% simple, 52% complex, Test: 53% simple, 47% complex). Finally the TableBank dataset consists of 145k tables provided as JPEG images. The latter has annotations for the table structure, but only few with bounding boxes of the table cells. The entire dataset consists of simple tables and it is divided into 90% Train, 3% Test and 7% Val splits."}, {"label": "text", "id": 4, "page_no": 2, "cluster": {"id": 4, "label": "text", "bbox": {"l": 308.862, "t": 632.783, "r": 545.115, "b": 713.066, "coord_origin": "TOPLEFT"}, "confidence": 0.9840091466903687, "cells": [{"index": 162, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 641.335, "r_x1": 545.115, "r_y1": 641.335, "r_x2": 545.115, "r_y2": 632.783, "r_x3": 320.817, "r_y3": 632.783, "coord_origin": "TOPLEFT"}, "text": "Due to the heterogeneity across the dataset formats, it", "orig": "Due to the heterogeneity across the dataset formats, it", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 163, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 653.29, "r_x1": 545.115, "r_y1": 653.29, "r_x2": 545.115, "r_y2": 644.738, "r_x3": 308.862, "r_y3": 644.738, "coord_origin": "TOPLEFT"}, "text": "was necessary to combine all available data into one homog-", "orig": "was necessary to combine all available data into one homog-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 164, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 665.245, "r_x1": 545.115, "r_y1": 665.245, "r_x2": 545.115, "r_y2": 656.693, "r_x3": 308.862, "r_y3": 656.693, "coord_origin": "TOPLEFT"}, "text": "enized dataset before we could train our models for practi-", "orig": "enized dataset before we could train our models for practi-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 165, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 677.201, "r_x1": 361.245, "r_y1": 677.201, "r_x2": 361.245, "r_y2": 668.649, "r_x3": 308.862, "r_y3": 668.649, "coord_origin": "TOPLEFT"}, "text": "cal purposes.", "orig": "cal purposes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 166, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 365.44, "r_y0": 677.201, "r_x1": 545.115, "r_y1": 677.201, "r_x2": 545.115, "r_y2": 668.649, "r_x3": 365.44, "r_y3": 668.649, "coord_origin": "TOPLEFT"}, "text": "Given the size of PubTabNet, we adopted its", "orig": "Given the size of PubTabNet, we adopted its", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 167, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 689.156, "r_x1": 545.115, "r_y1": 689.156, "r_x2": 545.115, "r_y2": 680.604, "r_x3": 308.862, "r_y3": 680.604, "coord_origin": "TOPLEFT"}, "text": "annotation format and we extracted and converted all tables", "orig": "annotation format and we extracted and converted all tables", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 168, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 701.111, "r_x1": 487.322, "r_y1": 701.111, "r_x2": 487.322, "r_y2": 692.559, "r_x3": 308.862, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "as PNG images with a resolution of 72 dpi.", "orig": "as PNG images with a resolution of 72 dpi.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 169, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 492.901, "r_y0": 701.111, "r_x1": 545.115, "r_y1": 701.111, "r_x2": 545.115, "r_y2": 692.559, "r_x3": 492.901, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "Additionally,", "orig": "Additionally,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 170, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 713.066, "r_x1": 545.115, "r_y1": 713.066, "r_x2": 545.115, "r_y2": 704.514, "r_x3": 308.862, "r_y3": 704.514, "coord_origin": "TOPLEFT"}, "text": "we have filtered out tables with extreme sizes due to small", "orig": "we have filtered out tables with extreme sizes due to small", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Due to the heterogeneity across the dataset formats, it was necessary to combine all available data into one homogenized dataset before we could train our models for practical purposes. Given the size of PubTabNet, we adopted its annotation format and we extracted and converted all tables as PNG images with a resolution of 72 dpi. Additionally, we have filtered out tables with extreme sizes due to small"}], "headers": [{"label": "page_footer", "id": 11, "page_no": 2, "cluster": {"id": 11, "label": "page_footer", "bbox": {"l": 295.121, "t": 734.402, "r": 300.102, "b": 742.954, "coord_origin": "TOPLEFT"}, "confidence": 0.8715606927871704, "cells": [{"index": 171, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 295.121, "r_y0": 742.954, "r_x1": 300.102, "r_y1": 742.954, "r_x2": 300.102, "r_y2": 734.402, "r_x3": 295.121, "r_y3": 734.402, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "3"}]}}, {"page_no": 3, "size": {"width": 612.0, "height": 792.0}, "cells": [{"index": 0, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 84.029, "r_x1": 286.365, "r_y1": 84.029, "r_x2": 286.365, "r_y2": 75.47699999999998, "r_x3": 50.112, "r_y3": 75.47699999999998, "coord_origin": "TOPLEFT"}, "text": "amount of such tables, and kept only those ones ranging", "orig": "amount of such tables, and kept only those ones ranging", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 95.98400000000004, "r_x1": 212.283, "r_y1": 95.98400000000004, "r_x2": 212.283, "r_y2": 87.43200000000002, "r_x3": 50.112, "r_y3": 87.43200000000002, "coord_origin": "TOPLEFT"}, "text": "between 1*1 and 20*10 (rows/columns).", "orig": "between 1*1 and 20*10 (rows/columns).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 109.78099999999995, "r_x1": 286.365, "r_y1": 109.78099999999995, "r_x2": 286.365, "r_y2": 101.22900000000004, "r_x3": 62.067, "r_y3": 101.22900000000004, "coord_origin": "TOPLEFT"}, "text": "The availability of the bounding boxes for all table cells", "orig": "The availability of the bounding boxes for all table cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 121.73599999999999, "r_x1": 176.458, "r_y1": 121.73599999999999, "r_x2": 176.458, "r_y2": 113.18399999999997, "r_x3": 50.112, "r_y3": 113.18399999999997, "coord_origin": "TOPLEFT"}, "text": "is essential to train our models.", "orig": "is essential to train our models.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 180.971, "r_y0": 121.73599999999999, "r_x1": 286.365, "r_y1": 121.73599999999999, "r_x2": 286.365, "r_y2": 113.18399999999997, "r_x3": 180.971, "r_y3": 113.18399999999997, "coord_origin": "TOPLEFT"}, "text": "In order to distinguish be-", "orig": "In order to distinguish be-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 133.69100000000003, "r_x1": 286.365, "r_y1": 133.69100000000003, "r_x2": 286.365, "r_y2": 125.13900000000001, "r_x3": 50.112, "r_y3": 125.13900000000001, "coord_origin": "TOPLEFT"}, "text": "tween empty and non-empty bounding boxes, we have in-", "orig": "tween empty and non-empty bounding boxes, we have in-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 145.64700000000005, "r_x1": 286.365, "r_y1": 145.64700000000005, "r_x2": 286.365, "r_y2": 137.09500000000003, "r_x3": 50.112, "r_y3": 137.09500000000003, "coord_origin": "TOPLEFT"}, "text": "troduced a binary class in the annotation. Unfortunately, the", "orig": "troduced a binary class in the annotation. Unfortunately, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 157.60199999999998, "r_x1": 286.365, "r_y1": 157.60199999999998, "r_x2": 286.365, "r_y2": 149.04999999999995, "r_x3": 50.112, "r_y3": 149.04999999999995, "coord_origin": "TOPLEFT"}, "text": "original datasets either omit the bounding boxes for whole", "orig": "original datasets either omit the bounding boxes for whole", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 169.55700000000002, "r_x1": 94.127, "r_y1": 169.55700000000002, "r_x2": 94.127, "r_y2": 161.005, "r_x3": 50.112, "r_y3": 161.005, "coord_origin": "TOPLEFT"}, "text": "tables (e.g.", "orig": "tables (e.g.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 98.959, "r_y0": 169.55700000000002, "r_x1": 286.365, "r_y1": 169.55700000000002, "r_x2": 286.365, "r_y2": 161.005, "r_x3": 98.959, "r_y3": 161.005, "coord_origin": "TOPLEFT"}, "text": "TableBank) or they narrow their scope only to", "orig": "TableBank) or they narrow their scope only to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 181.51199999999994, "r_x1": 116.951, "r_y1": 181.51199999999994, "r_x2": 116.951, "r_y2": 172.96000000000004, "r_x3": 50.112, "r_y3": 172.96000000000004, "coord_origin": "TOPLEFT"}, "text": "non-empty cells.", "orig": "non-empty cells.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 121.345, "r_y0": 181.51199999999994, "r_x1": 286.365, "r_y1": 181.51199999999994, "r_x2": 286.365, "r_y2": 172.96000000000004, "r_x3": 121.345, "r_y3": 172.96000000000004, "coord_origin": "TOPLEFT"}, "text": "Therefore, it was imperative to introduce", "orig": "Therefore, it was imperative to introduce", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 193.46699999999998, "r_x1": 286.365, "r_y1": 193.46699999999998, "r_x2": 286.365, "r_y2": 184.91499999999996, "r_x3": 50.112, "r_y3": 184.91499999999996, "coord_origin": "TOPLEFT"}, "text": "a data pre-processing procedure that generates the missing", "orig": "a data pre-processing procedure that generates the missing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 205.423, "r_x1": 286.365, "r_y1": 205.423, "r_x2": 286.365, "r_y2": 196.87099999999998, "r_x3": 50.112, "r_y3": 196.87099999999998, "coord_origin": "TOPLEFT"}, "text": "bounding boxes out of the annotation information. This pro-", "orig": "bounding boxes out of the annotation information. This pro-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 217.37800000000004, "r_x1": 286.365, "r_y1": 217.37800000000004, "r_x2": 286.365, "r_y2": 208.82600000000002, "r_x3": 50.112, "r_y3": 208.82600000000002, "coord_origin": "TOPLEFT"}, "text": "cedure first parses the provided table structure and calcu-", "orig": "cedure first parses the provided table structure and calcu-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 229.33299999999997, "r_x1": 286.365, "r_y1": 229.33299999999997, "r_x2": 286.365, "r_y2": 220.78099999999995, "r_x3": 50.112, "r_y3": 220.78099999999995, "coord_origin": "TOPLEFT"}, "text": "lates the dimensions of the most fine-grained grid that cov-", "orig": "lates the dimensions of the most fine-grained grid that cov-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 241.288, "r_x1": 139.805, "r_y1": 241.288, "r_x2": 139.805, "r_y2": 232.736, "r_x3": 50.112, "r_y3": 232.736, "coord_origin": "TOPLEFT"}, "text": "ers the table structure.", "orig": "ers the table structure.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 144.607, "r_y0": 241.288, "r_x1": 286.365, "r_y1": 241.288, "r_x2": 286.365, "r_y2": 232.736, "r_x3": 144.607, "r_y3": 232.736, "coord_origin": "TOPLEFT"}, "text": "Notice that each table cell may oc-", "orig": "Notice that each table cell may oc-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 253.24300000000005, "r_x1": 286.365, "r_y1": 253.24300000000005, "r_x2": 286.365, "r_y2": 244.69100000000003, "r_x3": 50.112, "r_y3": 244.69100000000003, "coord_origin": "TOPLEFT"}, "text": "cupy multiple grid squares due to row or column spans. In", "orig": "cupy multiple grid squares due to row or column spans. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 19, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 265.198, "r_x1": 286.365, "r_y1": 265.198, "r_x2": 286.365, "r_y2": 256.64599999999996, "r_x3": 50.112, "r_y3": 256.64599999999996, "coord_origin": "TOPLEFT"}, "text": "case of PubTabNet we had to compute missing bounding", "orig": "case of PubTabNet we had to compute missing bounding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 20, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 277.154, "r_x1": 286.365, "r_y1": 277.154, "r_x2": 286.365, "r_y2": 268.602, "r_x3": 50.112, "r_y3": 268.602, "coord_origin": "TOPLEFT"}, "text": "boxes for 48% of the simple and 69% of the complex ta-", "orig": "boxes for 48% of the simple and 69% of the complex ta-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 21, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 289.109, "r_x1": 68.652, "r_y1": 289.109, "r_x2": 68.652, "r_y2": 280.557, "r_x3": 50.112, "r_y3": 280.557, "coord_origin": "TOPLEFT"}, "text": "bles.", "orig": "bles.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 22, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 75.566, "r_y0": 289.109, "r_x1": 286.365, "r_y1": 289.109, "r_x2": 286.365, "r_y2": 280.557, "r_x3": 75.566, "r_y3": 280.557, "coord_origin": "TOPLEFT"}, "text": "Regarding FinTabNet, 68% of the simple and 98%", "orig": "Regarding FinTabNet, 68% of the simple and 98%", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 23, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 301.064, "r_x1": 286.365, "r_y1": 301.064, "r_x2": 286.365, "r_y2": 292.512, "r_x3": 50.112, "r_y3": 292.512, "coord_origin": "TOPLEFT"}, "text": "of the complex tables require the generation of bounding", "orig": "of the complex tables require the generation of bounding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 24, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 313.019, "r_x1": 75.696, "r_y1": 313.019, "r_x2": 75.696, "r_y2": 304.467, "r_x3": 50.112, "r_y3": 304.467, "coord_origin": "TOPLEFT"}, "text": "boxes.", "orig": "boxes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 25, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 326.816, "r_x1": 286.365, "r_y1": 326.816, "r_x2": 286.365, "r_y2": 318.264, "r_x3": 62.067, "r_y3": 318.264, "coord_origin": "TOPLEFT"}, "text": "As it is illustrated in Fig. 2, the table distributions from", "orig": "As it is illustrated in Fig. 2, the table distributions from", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 26, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 338.772, "r_x1": 60.075, "r_y1": 338.772, "r_x2": 60.075, "r_y2": 330.22, "r_x3": 50.112, "r_y3": 330.22, "coord_origin": "TOPLEFT"}, "text": "all", "orig": "all", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 27, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 65.146, "r_y0": 338.772, "r_x1": 96.687, "r_y1": 338.772, "r_x2": 96.687, "r_y2": 330.22, "r_x3": 65.146, "r_y3": 330.22, "coord_origin": "TOPLEFT"}, "text": "datasets", "orig": "datasets", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 28, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 101.768, "r_y0": 338.772, "r_x1": 113.932, "r_y1": 338.772, "r_x2": 113.932, "r_y2": 330.22, "r_x3": 101.768, "r_y3": 330.22, "coord_origin": "TOPLEFT"}, "text": "are", "orig": "are", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 29, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 119.003, "r_y0": 338.772, "r_x1": 148.533, "r_y1": 338.772, "r_x2": 148.533, "r_y2": 330.22, "r_x3": 119.003, "r_y3": 330.22, "coord_origin": "TOPLEFT"}, "text": "skewed", "orig": "skewed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 30, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 153.613, "r_y0": 338.772, "r_x1": 184.806, "r_y1": 338.772, "r_x2": 184.806, "r_y2": 330.22, "r_x3": 153.613, "r_y3": 330.22, "coord_origin": "TOPLEFT"}, "text": "towards", "orig": "towards", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 189.877, "r_y0": 338.772, "r_x1": 219.765, "r_y1": 338.772, "r_x2": 219.765, "r_y2": 330.22, "r_x3": 189.877, "r_y3": 330.22, "coord_origin": "TOPLEFT"}, "text": "simpler", "orig": "simpler", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 224.836, "r_y0": 338.772, "r_x1": 263.571, "r_y1": 338.772, "r_x2": 263.571, "r_y2": 330.22, "r_x3": 224.836, "r_y3": 330.22, "coord_origin": "TOPLEFT"}, "text": "structures", "orig": "structures", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 268.652, "r_y0": 338.772, "r_x1": 286.365, "r_y1": 338.772, "r_x2": 286.365, "r_y2": 330.22, "r_x3": 268.652, "r_y3": 330.22, "coord_origin": "TOPLEFT"}, "text": "with", "orig": "with", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 350.727, "r_x1": 286.365, "r_y1": 350.727, "r_x2": 286.365, "r_y2": 342.175, "r_x3": 50.112, "r_y3": 342.175, "coord_origin": "TOPLEFT"}, "text": "fewer number of rows/columns. Additionally, there is very", "orig": "fewer number of rows/columns. Additionally, there is very", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 362.682, "r_x1": 286.365, "r_y1": 362.682, "r_x2": 286.365, "r_y2": 354.13, "r_x3": 50.112, "r_y3": 354.13, "coord_origin": "TOPLEFT"}, "text": "limited variance in the table styles, which in case of Pub-", "orig": "limited variance in the table styles, which in case of Pub-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 374.637, "r_x1": 286.365, "r_y1": 374.637, "r_x2": 286.365, "r_y2": 366.085, "r_x3": 50.112, "r_y3": 366.085, "coord_origin": "TOPLEFT"}, "text": "TabNet and FinTabNet means one styling format for the", "orig": "TabNet and FinTabNet means one styling format for the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 386.592, "r_x1": 141.589, "r_y1": 386.592, "r_x2": 141.589, "r_y2": 378.04, "r_x3": 50.112, "r_y3": 378.04, "coord_origin": "TOPLEFT"}, "text": "majority of the tables.", "orig": "majority of the tables.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 148.702, "r_y0": 386.592, "r_x1": 286.365, "r_y1": 386.592, "r_x2": 286.365, "r_y2": 378.04, "r_x3": 148.702, "r_y3": 378.04, "coord_origin": "TOPLEFT"}, "text": "Similar limitations appear also in", "orig": "Similar limitations appear also in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 398.547, "r_x1": 286.365, "r_y1": 398.547, "r_x2": 286.365, "r_y2": 389.995, "r_x3": 50.112, "r_y3": 389.995, "coord_origin": "TOPLEFT"}, "text": "the type of table content, which in some cases (e.g. FinTab-", "orig": "the type of table content, which in some cases (e.g. FinTab-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 410.503, "r_x1": 201.822, "r_y1": 410.503, "r_x2": 201.822, "r_y2": 401.951, "r_x3": 50.112, "r_y3": 401.951, "coord_origin": "TOPLEFT"}, "text": "Net) is restricted to a certain domain.", "orig": "Net) is restricted to a certain domain.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 206.764, "r_y0": 410.503, "r_x1": 286.365, "r_y1": 410.503, "r_x2": 286.365, "r_y2": 401.951, "r_x3": 206.764, "r_y3": 401.951, "coord_origin": "TOPLEFT"}, "text": "Ultimately, the lack", "orig": "Ultimately, the lack", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 422.458, "r_x1": 286.365, "r_y1": 422.458, "r_x2": 286.365, "r_y2": 413.906, "r_x3": 50.112, "r_y3": 413.906, "coord_origin": "TOPLEFT"}, "text": "of diversity in the training dataset damages the ability of the", "orig": "of diversity in the training dataset damages the ability of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 434.413, "r_x1": 216.398, "r_y1": 434.413, "r_x2": 216.398, "r_y2": 425.861, "r_x3": 50.112, "r_y3": 425.861, "coord_origin": "TOPLEFT"}, "text": "models to generalize well on unseen data.", "orig": "models to generalize well on unseen data.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 448.21, "r_x1": 286.365, "r_y1": 448.21, "r_x2": 286.365, "r_y2": 439.658, "r_x3": 62.067, "r_y3": 439.658, "coord_origin": "TOPLEFT"}, "text": "Motivated by those observations we aimed at generating", "orig": "Motivated by those observations we aimed at generating", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 460.165, "r_x1": 172.144, "r_y1": 460.165, "r_x2": 172.144, "r_y2": 451.613, "r_x3": 50.112, "r_y3": 451.613, "coord_origin": "TOPLEFT"}, "text": "a synthetic table dataset named", "orig": "a synthetic table dataset named", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 174.148, "r_y0": 460.022, "r_x1": 224.708, "r_y1": 460.022, "r_x2": 224.708, "r_y2": 451.434, "r_x3": 174.148, "r_y3": 451.434, "coord_origin": "TOPLEFT"}, "text": "SynthTabNet", "orig": "SynthTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 224.708, "r_y0": 460.165, "r_x1": 227.199, "r_y1": 460.165, "r_x2": 227.199, "r_y2": 451.613, "r_x3": 224.708, "r_y3": 451.613, "coord_origin": "TOPLEFT"}, "text": ".", "orig": ".", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 48, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 230.128, "r_y0": 460.165, "r_x1": 286.367, "r_y1": 460.165, "r_x2": 286.367, "r_y2": 451.613, "r_x3": 230.128, "r_y3": 451.613, "coord_origin": "TOPLEFT"}, "text": "This approach", "orig": "This approach", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 49, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 472.121, "r_x1": 128.179, "r_y1": 472.121, "r_x2": 128.179, "r_y2": 463.569, "r_x3": 50.112, "r_y3": 463.569, "coord_origin": "TOPLEFT"}, "text": "offers control over:", "orig": "offers control over:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 50, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 132.971, "r_y0": 472.121, "r_x1": 286.365, "r_y1": 472.121, "r_x2": 286.365, "r_y2": 463.569, "r_x3": 132.971, "r_y3": 463.569, "coord_origin": "TOPLEFT"}, "text": "1) the size of the dataset, 2) the table", "orig": "1) the size of the dataset, 2) the table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 51, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 484.076, "r_x1": 266.739, "r_y1": 484.076, "r_x2": 266.739, "r_y2": 475.524, "r_x3": 50.112, "r_y3": 475.524, "coord_origin": "TOPLEFT"}, "text": "structure, 3) the table style and 4) the type of content.", "orig": "structure, 3) the table style and 4) the type of content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 52, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 270.873, "r_y0": 484.076, "r_x1": 286.365, "r_y1": 484.076, "r_x2": 286.365, "r_y2": 475.524, "r_x3": 270.873, "r_y3": 475.524, "coord_origin": "TOPLEFT"}, "text": "The", "orig": "The", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 53, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 496.031, "r_x1": 286.365, "r_y1": 496.031, "r_x2": 286.365, "r_y2": 487.479, "r_x3": 50.112, "r_y3": 487.479, "coord_origin": "TOPLEFT"}, "text": "complexity of the table structure is described by the size of", "orig": "complexity of the table structure is described by the size of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 54, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 507.986, "r_x1": 286.365, "r_y1": 507.986, "r_x2": 286.365, "r_y2": 499.434, "r_x3": 50.112, "r_y3": 499.434, "coord_origin": "TOPLEFT"}, "text": "the table header and the table body, as well as the percentage", "orig": "the table header and the table body, as well as the percentage", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 55, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 519.941, "r_x1": 286.365, "r_y1": 519.941, "r_x2": 286.365, "r_y2": 511.389, "r_x3": 50.112, "r_y3": 511.389, "coord_origin": "TOPLEFT"}, "text": "of the table cells covered by row spans and column spans.", "orig": "of the table cells covered by row spans and column spans.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 56, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 531.8969999999999, "r_x1": 286.365, "r_y1": 531.8969999999999, "r_x2": 286.365, "r_y2": 523.345, "r_x3": 50.112, "r_y3": 523.345, "coord_origin": "TOPLEFT"}, "text": "A set of carefully designed styling templates provides the", "orig": "A set of carefully designed styling templates provides the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 57, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 543.852, "r_x1": 286.365, "r_y1": 543.852, "r_x2": 286.365, "r_y2": 535.3, "r_x3": 50.112, "r_y3": 535.3, "coord_origin": "TOPLEFT"}, "text": "basis to build a wide range of table appearances. Lastly, the", "orig": "basis to build a wide range of table appearances. Lastly, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 58, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 555.807, "r_x1": 286.365, "r_y1": 555.807, "r_x2": 286.365, "r_y2": 547.255, "r_x3": 50.112, "r_y3": 547.255, "coord_origin": "TOPLEFT"}, "text": "table content is generated out of a curated collection of text", "orig": "table content is generated out of a curated collection of text", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 59, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 567.762, "r_x1": 83.028, "r_y1": 567.762, "r_x2": 83.028, "r_y2": 559.21, "r_x3": 50.112, "r_y3": 559.21, "coord_origin": "TOPLEFT"}, "text": "corpora.", "orig": "corpora.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 60, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 87.153, "r_y0": 567.762, "r_x1": 286.365, "r_y1": 567.762, "r_x2": 286.365, "r_y2": 559.21, "r_x3": 87.153, "r_y3": 559.21, "coord_origin": "TOPLEFT"}, "text": "By controlling the size and scope of the synthetic", "orig": "By controlling the size and scope of the synthetic", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 61, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 579.717, "r_x1": 286.365, "r_y1": 579.717, "r_x2": 286.365, "r_y2": 571.165, "r_x3": 50.112, "r_y3": 571.165, "coord_origin": "TOPLEFT"}, "text": "datasets we are able to train and evaluate our models in a", "orig": "datasets we are able to train and evaluate our models in a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 62, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 591.672, "r_x1": 174.645, "r_y1": 591.672, "r_x2": 174.645, "r_y2": 583.12, "r_x3": 50.112, "r_y3": 583.12, "coord_origin": "TOPLEFT"}, "text": "variety of different conditions.", "orig": "variety of different conditions.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 63, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 181.021, "r_y0": 591.672, "r_x1": 286.365, "r_y1": 591.672, "r_x2": 286.365, "r_y2": 583.12, "r_x3": 181.021, "r_y3": 583.12, "coord_origin": "TOPLEFT"}, "text": "For example, we can first", "orig": "For example, we can first", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 64, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 603.6279999999999, "r_x1": 286.365, "r_y1": 603.6279999999999, "r_x2": 286.365, "r_y2": 595.076, "r_x3": 50.112, "r_y3": 595.076, "coord_origin": "TOPLEFT"}, "text": "generate a highly diverse dataset to train our models and", "orig": "generate a highly diverse dataset to train our models and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 65, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 615.583, "r_x1": 286.365, "r_y1": 615.583, "r_x2": 286.365, "r_y2": 607.031, "r_x3": 50.112, "r_y3": 607.031, "coord_origin": "TOPLEFT"}, "text": "then evaluate their performance on other synthetic datasets", "orig": "then evaluate their performance on other synthetic datasets", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 66, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 627.538, "r_x1": 209.753, "r_y1": 627.538, "r_x2": 209.753, "r_y2": 618.986, "r_x3": 50.112, "r_y3": 618.986, "coord_origin": "TOPLEFT"}, "text": "which are focused on a specific domain.", "orig": "which are focused on a specific domain.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 67, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 641.335, "r_x1": 286.365, "r_y1": 641.335, "r_x2": 286.365, "r_y2": 632.783, "r_x3": 62.067, "r_y3": 632.783, "coord_origin": "TOPLEFT"}, "text": "In this regard, we have prepared four synthetic datasets,", "orig": "In this regard, we have prepared four synthetic datasets,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 68, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 653.29, "r_x1": 286.365, "r_y1": 653.29, "r_x2": 286.365, "r_y2": 644.738, "r_x3": 50.112, "r_y3": 644.738, "coord_origin": "TOPLEFT"}, "text": "each one containing 150k examples. The corpora to gener-", "orig": "each one containing 150k examples. The corpora to gener-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 69, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 665.246, "r_x1": 286.365, "r_y1": 665.246, "r_x2": 286.365, "r_y2": 656.694, "r_x3": 50.112, "r_y3": 656.694, "coord_origin": "TOPLEFT"}, "text": "ate the table text consists of the most frequent terms appear-", "orig": "ate the table text consists of the most frequent terms appear-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 70, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 677.201, "r_x1": 286.365, "r_y1": 677.201, "r_x2": 286.365, "r_y2": 668.649, "r_x3": 50.112, "r_y3": 668.649, "coord_origin": "TOPLEFT"}, "text": "ing in PubTabNet and FinTabNet together with randomly", "orig": "ing in PubTabNet and FinTabNet together with randomly", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 71, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 689.156, "r_x1": 109.519, "r_y1": 689.156, "r_x2": 109.519, "r_y2": 680.604, "r_x3": 50.112, "r_y3": 680.604, "coord_origin": "TOPLEFT"}, "text": "generated text.", "orig": "generated text.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 72, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 115.337, "r_y0": 689.156, "r_x1": 286.365, "r_y1": 689.156, "r_x2": 286.365, "r_y2": 680.604, "r_x3": 115.337, "r_y3": 680.604, "coord_origin": "TOPLEFT"}, "text": "The first two synthetic datasets have been", "orig": "The first two synthetic datasets have been", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 73, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 701.111, "r_x1": 286.365, "r_y1": 701.111, "r_x2": 286.365, "r_y2": 692.559, "r_x3": 50.112, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "fine-tuned to mimic the appearance of the original datasets", "orig": "fine-tuned to mimic the appearance of the original datasets", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 74, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 713.066, "r_x1": 286.365, "r_y1": 713.066, "r_x2": 286.365, "r_y2": 704.514, "r_x3": 50.112, "r_y3": 704.514, "coord_origin": "TOPLEFT"}, "text": "but encompass more complicated table structures. The third", "orig": "but encompass more complicated table structures. The third", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 75, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 412.332, "r_y0": 82.43499999999995, "r_x1": 430.902, "r_y1": 82.43499999999995, "r_x2": 430.902, "r_y2": 73.88300000000004, "r_x3": 412.332, "r_y3": 73.88300000000004, "coord_origin": "TOPLEFT"}, "text": "Tags", "orig": "Tags", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 76, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 442.857, "r_y0": 82.43499999999995, "r_x1": 464.446, "r_y1": 82.43499999999995, "r_x2": 464.446, "r_y2": 73.88300000000004, "r_x3": 442.857, "r_y3": 73.88300000000004, "coord_origin": "TOPLEFT"}, "text": "Bbox", "orig": "Bbox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 77, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 477.786, "r_y0": 82.43499999999995, "r_x1": 494.942, "r_y1": 82.43499999999995, "r_x2": 494.942, "r_y2": 73.88300000000004, "r_x3": 477.786, "r_y3": 73.88300000000004, "coord_origin": "TOPLEFT"}, "text": "Size", "orig": "Size", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 78, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 508.282, "r_y0": 82.43499999999995, "r_x1": 536.914, "r_y1": 82.43499999999995, "r_x2": 536.914, "r_y2": 73.88300000000004, "r_x3": 508.282, "r_y3": 73.88300000000004, "coord_origin": "TOPLEFT"}, "text": "Format", "orig": "Format", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 79, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 317.06, "r_y0": 94.78800000000001, "r_x1": 361.643, "r_y1": 94.78800000000001, "r_x2": 361.643, "r_y2": 86.23599999999999, "r_x3": 317.06, "r_y3": 86.23599999999999, "coord_origin": "TOPLEFT"}, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 80, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 417.856, "r_y0": 92.72199999999998, "r_x1": 425.378, "r_y1": 92.72199999999998, "r_x2": 425.378, "r_y2": 85.668, "r_x3": 417.856, "r_y3": 85.668, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 81, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 449.896, "r_y0": 92.72199999999998, "r_x1": 457.417, "r_y1": 92.72199999999998, "r_x2": 457.417, "r_y2": 85.668, "r_x3": 449.896, "r_y3": 85.668, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 82, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 476.401, "r_y0": 94.78800000000001, "r_x1": 496.326, "r_y1": 94.78800000000001, "r_x2": 496.326, "r_y2": 86.23599999999999, "r_x3": 476.401, "r_y3": 86.23599999999999, "coord_origin": "TOPLEFT"}, "text": "509k", "orig": "509k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 83, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 512.635, "r_y0": 94.78800000000001, "r_x1": 532.56, "r_y1": 94.78800000000001, "r_x2": 532.56, "r_y2": 86.23599999999999, "r_x3": 512.635, "r_y3": 86.23599999999999, "coord_origin": "TOPLEFT"}, "text": "PNG", "orig": "PNG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 84, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 317.06, "r_y0": 106.74300000000005, "r_x1": 359.431, "r_y1": 106.74300000000005, "r_x2": 359.431, "r_y2": 98.19100000000003, "r_x3": 317.06, "r_y3": 98.19100000000003, "coord_origin": "TOPLEFT"}, "text": "FinTabNet", "orig": "FinTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 85, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 417.856, "r_y0": 104.67700000000002, "r_x1": 425.378, "r_y1": 104.67700000000002, "r_x2": 425.378, "r_y2": 97.62300000000005, "r_x3": 417.856, "r_y3": 97.62300000000005, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 86, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 449.896, "r_y0": 104.67700000000002, "r_x1": 457.417, "r_y1": 104.67700000000002, "r_x2": 457.417, "r_y2": 97.62300000000005, "r_x3": 449.896, "r_y3": 97.62300000000005, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 87, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 476.401, "r_y0": 106.74300000000005, "r_x1": 496.326, "r_y1": 106.74300000000005, "r_x2": 496.326, "r_y2": 98.19100000000003, "r_x3": 476.401, "r_y3": 98.19100000000003, "coord_origin": "TOPLEFT"}, "text": "112k", "orig": "112k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 88, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 513.462, "r_y0": 106.74300000000005, "r_x1": 531.733, "r_y1": 106.74300000000005, "r_x2": 531.733, "r_y2": 98.19100000000003, "r_x3": 513.462, "r_y3": 98.19100000000003, "coord_origin": "TOPLEFT"}, "text": "PDF", "orig": "PDF", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 89, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 317.06, "r_y0": 118.69899999999996, "r_x1": 359.979, "r_y1": 118.69899999999996, "r_x2": 359.979, "r_y2": 110.14700000000005, "r_x3": 317.06, "r_y3": 110.14700000000005, "coord_origin": "TOPLEFT"}, "text": "TableBank", "orig": "TableBank", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 90, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 417.856, "r_y0": 116.63300000000004, "r_x1": 425.378, "r_y1": 116.63300000000004, "r_x2": 425.378, "r_y2": 109.57899999999995, "r_x3": 417.856, "r_y3": 109.57899999999995, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 91, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 450.812, "r_y0": 116.63300000000004, "r_x1": 456.501, "r_y1": 116.63300000000004, "r_x2": 456.501, "r_y2": 109.57899999999995, "r_x3": 450.812, "r_y3": 109.57899999999995, "coord_origin": "TOPLEFT"}, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 92, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 476.401, "r_y0": 118.69899999999996, "r_x1": 496.326, "r_y1": 118.69899999999996, "r_x2": 496.326, "r_y2": 110.14700000000005, "r_x3": 476.401, "r_y3": 110.14700000000005, "coord_origin": "TOPLEFT"}, "text": "145k", "orig": "145k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 93, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 511.25, "r_y0": 118.69899999999996, "r_x1": 533.945, "r_y1": 118.69899999999996, "r_x2": 533.945, "r_y2": 110.14700000000005, "r_x3": 511.25, "r_y3": 110.14700000000005, "coord_origin": "TOPLEFT"}, "text": "JPEG", "orig": "JPEG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 94, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 317.06, "r_y0": 130.654, "r_x1": 400.377, "r_y1": 130.654, "r_x2": 400.377, "r_y2": 122.10199999999998, "r_x3": 317.06, "r_y3": 122.10199999999998, "coord_origin": "TOPLEFT"}, "text": "Combined-Tabnet(*)", "orig": "Combined-Tabnet(*)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 95, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 417.856, "r_y0": 128.58799999999997, "r_x1": 425.378, "r_y1": 128.58799999999997, "r_x2": 425.378, "r_y2": 121.53399999999999, "r_x3": 417.856, "r_y3": 121.53399999999999, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 96, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 449.896, "r_y0": 128.58799999999997, "r_x1": 457.417, "r_y1": 128.58799999999997, "r_x2": 457.417, "r_y2": 121.53399999999999, "r_x3": 449.896, "r_y3": 121.53399999999999, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 97, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 476.401, "r_y0": 130.654, "r_x1": 496.326, "r_y1": 130.654, "r_x2": 496.326, "r_y2": 122.10199999999998, "r_x3": 476.401, "r_y3": 122.10199999999998, "coord_origin": "TOPLEFT"}, "text": "400k", "orig": "400k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 98, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 512.635, "r_y0": 130.654, "r_x1": 532.56, "r_y1": 130.654, "r_x2": 532.56, "r_y2": 122.10199999999998, "r_x3": 512.635, "r_y3": 122.10199999999998, "coord_origin": "TOPLEFT"}, "text": "PNG", "orig": "PNG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 99, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 317.06, "r_y0": 142.60900000000004, "r_x1": 375.172, "r_y1": 142.60900000000004, "r_x2": 375.172, "r_y2": 134.05700000000002, "r_x3": 317.06, "r_y3": 134.05700000000002, "coord_origin": "TOPLEFT"}, "text": "Combined(**)", "orig": "Combined(**)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 100, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 417.856, "r_y0": 140.543, "r_x1": 425.378, "r_y1": 140.543, "r_x2": 425.378, "r_y2": 133.48900000000003, "r_x3": 417.856, "r_y3": 133.48900000000003, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 101, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 449.896, "r_y0": 140.543, "r_x1": 457.417, "r_y1": 140.543, "r_x2": 457.417, "r_y2": 133.48900000000003, "r_x3": 449.896, "r_y3": 133.48900000000003, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 102, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 476.401, "r_y0": 142.60900000000004, "r_x1": 496.326, "r_y1": 142.60900000000004, "r_x2": 496.326, "r_y2": 134.05700000000002, "r_x3": 476.401, "r_y3": 134.05700000000002, "coord_origin": "TOPLEFT"}, "text": "500k", "orig": "500k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 103, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 512.635, "r_y0": 142.60900000000004, "r_x1": 532.56, "r_y1": 142.60900000000004, "r_x2": 532.56, "r_y2": 134.05700000000002, "r_x3": 512.635, "r_y3": 134.05700000000002, "coord_origin": "TOPLEFT"}, "text": "PNG", "orig": "PNG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 104, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 317.06, "r_y0": 154.56399999999996, "r_x1": 369.394, "r_y1": 154.56399999999996, "r_x2": 369.394, "r_y2": 146.01199999999994, "r_x3": 317.06, "r_y3": 146.01199999999994, "coord_origin": "TOPLEFT"}, "text": "SynthTabNet", "orig": "SynthTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 105, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 417.856, "r_y0": 152.49800000000005, "r_x1": 425.378, "r_y1": 152.49800000000005, "r_x2": 425.378, "r_y2": 145.44399999999996, "r_x3": 417.856, "r_y3": 145.44399999999996, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 106, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 449.896, "r_y0": 152.49800000000005, "r_x1": 457.417, "r_y1": 152.49800000000005, "r_x2": 457.417, "r_y2": 145.44399999999996, "r_x3": 449.896, "r_y3": 145.44399999999996, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 107, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 476.401, "r_y0": 154.56399999999996, "r_x1": 496.326, "r_y1": 154.56399999999996, "r_x2": 496.326, "r_y2": 146.01199999999994, "r_x3": 476.401, "r_y3": 146.01199999999994, "coord_origin": "TOPLEFT"}, "text": "600k", "orig": "600k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 108, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 512.635, "r_y0": 154.56399999999996, "r_x1": 532.56, "r_y1": 154.56399999999996, "r_x2": 532.56, "r_y2": 146.01199999999994, "r_x3": 512.635, "r_y3": 146.01199999999994, "coord_origin": "TOPLEFT"}, "text": "PNG", "orig": "PNG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 109, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 176.48199999999997, "r_x1": 330.75, "r_y1": 176.48199999999997, "r_x2": 330.75, "r_y2": 167.92999999999995, "r_x3": 308.862, "r_y3": 167.92999999999995, "coord_origin": "TOPLEFT"}, "text": "Table", "orig": "Table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 110, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 336.867, "r_y0": 176.48199999999997, "r_x1": 344.618, "r_y1": 176.48199999999997, "r_x2": 344.618, "r_y2": 167.92999999999995, "r_x3": 336.867, "r_y3": 167.92999999999995, "coord_origin": "TOPLEFT"}, "text": "1:", "orig": "1:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 111, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 361.076, "r_y0": 176.48199999999997, "r_x1": 380.453, "r_y1": 176.48199999999997, "r_x2": 380.453, "r_y2": 167.92999999999995, "r_x3": 361.076, "r_y3": 167.92999999999995, "coord_origin": "TOPLEFT"}, "text": "Both", "orig": "Both", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 112, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 386.568, "r_y0": 176.33900000000006, "r_x1": 468.68, "r_y1": 176.33900000000006, "r_x2": 468.68, "r_y2": 167.75099999999998, "r_x3": 386.568, "r_y3": 167.75099999999998, "coord_origin": "TOPLEFT"}, "text": "'Combined-Tabnet'", "orig": "'Combined-Tabnet'", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 113, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 474.796, "r_y0": 176.48199999999997, "r_x1": 489.182, "r_y1": 176.48199999999997, "r_x2": 489.182, "r_y2": 167.92999999999995, "r_x3": 474.796, "r_y3": 167.92999999999995, "coord_origin": "TOPLEFT"}, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 114, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 495.299, "r_y0": 176.33900000000006, "r_x1": 545.112, "r_y1": 176.33900000000006, "r_x2": 545.112, "r_y2": 167.75099999999998, "r_x3": 495.299, "r_y3": 167.75099999999998, "coord_origin": "TOPLEFT"}, "text": "'Combined-", "orig": "'Combined-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 115, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 188.29399999999998, "r_x1": 341.161, "r_y1": 188.29399999999998, "r_x2": 341.161, "r_y2": 179.70600000000002, "r_x3": 308.862, "r_y3": 179.70600000000002, "coord_origin": "TOPLEFT"}, "text": "Tabnet'", "orig": "Tabnet'", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 116, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 343.457, "r_y0": 188.437, "r_x1": 545.11, "r_y1": 188.437, "r_x2": 545.11, "r_y2": 179.885, "r_x3": 343.457, "r_y3": 179.885, "coord_origin": "TOPLEFT"}, "text": "are variations of the following: (*) The Combined-", "orig": "are variations of the following: (*) The Combined-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 117, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 200.39200000000005, "r_x1": 545.115, "r_y1": 200.39200000000005, "r_x2": 545.115, "r_y2": 191.84000000000003, "r_x3": 308.862, "r_y3": 191.84000000000003, "coord_origin": "TOPLEFT"}, "text": "Tabnet dataset is the processed combination of PubTabNet", "orig": "Tabnet dataset is the processed combination of PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 118, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 212.34699999999998, "r_x1": 366.276, "r_y1": 212.34699999999998, "r_x2": 366.276, "r_y2": 203.79499999999996, "r_x3": 308.862, "r_y3": 203.79499999999996, "coord_origin": "TOPLEFT"}, "text": "and Fintabnet.", "orig": "and Fintabnet.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 119, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 370.58, "r_y0": 212.34699999999998, "r_x1": 545.115, "r_y1": 212.34699999999998, "r_x2": 545.115, "r_y2": 203.79499999999996, "r_x3": 370.58, "r_y3": 203.79499999999996, "coord_origin": "TOPLEFT"}, "text": "(**) The combined dataset is the processed", "orig": "(**) The combined dataset is the processed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 120, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 224.303, "r_x1": 523.935, "r_y1": 224.303, "r_x2": 523.935, "r_y2": 215.75099999999998, "r_x3": 308.862, "r_y3": 215.75099999999998, "coord_origin": "TOPLEFT"}, "text": "combination of PubTabNet, Fintabnet and TableBank.", "orig": "combination of PubTabNet, Fintabnet and TableBank.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 121, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 258.44100000000003, "r_x1": 545.115, "r_y1": 258.44100000000003, "r_x2": 545.115, "r_y2": 249.889, "r_x3": 308.862, "r_y3": 249.889, "coord_origin": "TOPLEFT"}, "text": "one adopts a colorful appearance with high contrast and the", "orig": "one adopts a colorful appearance with high contrast and the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 122, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 270.39599999999996, "r_x1": 545.115, "r_y1": 270.39599999999996, "r_x2": 545.115, "r_y2": 261.84400000000005, "r_x3": 308.862, "r_y3": 261.84400000000005, "coord_origin": "TOPLEFT"}, "text": "last one contains tables with sparse content. Lastly, we have", "orig": "last one contains tables with sparse content. Lastly, we have", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 123, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 282.351, "r_x1": 545.115, "r_y1": 282.351, "r_x2": 545.115, "r_y2": 273.799, "r_x3": 308.862, "r_y3": 273.799, "coord_origin": "TOPLEFT"}, "text": "combined all synthetic datasets into one big unified syn-", "orig": "combined all synthetic datasets into one big unified syn-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 124, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 294.306, "r_x1": 436.822, "r_y1": 294.306, "r_x2": 436.822, "r_y2": 285.754, "r_x3": 308.862, "r_y3": 285.754, "coord_origin": "TOPLEFT"}, "text": "thetic dataset of 600k examples.", "orig": "thetic dataset of 600k examples.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 125, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 306.593, "r_x1": 542.744, "r_y1": 306.593, "r_x2": 542.744, "r_y2": 298.041, "r_x3": 320.817, "r_y3": 298.041, "coord_origin": "TOPLEFT"}, "text": "Tab. 1 summarizes the various attributes of the datasets.", "orig": "Tab. 1 summarizes the various attributes of the datasets.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 126, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 331.932, "r_x1": 444.936, "r_y1": 331.932, "r_x2": 444.936, "r_y2": 321.184, "r_x3": 308.862, "r_y3": 321.184, "coord_origin": "TOPLEFT"}, "text": "4. The TableFormer model", "orig": "4. The TableFormer model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 127, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 350.76, "r_x1": 545.115, "r_y1": 350.76, "r_x2": 545.115, "r_y2": 342.208, "r_x3": 320.817, "r_y3": 342.208, "coord_origin": "TOPLEFT"}, "text": "Given the image of a table, TableFormer is able to pre-", "orig": "Given the image of a table, TableFormer is able to pre-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 128, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 362.715, "r_x1": 326.576, "r_y1": 362.715, "r_x2": 326.576, "r_y2": 354.163, "r_x3": 308.862, "r_y3": 354.163, "coord_origin": "TOPLEFT"}, "text": "dict:", "orig": "dict:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 129, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 330.172, "r_y0": 362.715, "r_x1": 545.115, "r_y1": 362.715, "r_x2": 545.115, "r_y2": 354.163, "r_x3": 330.172, "r_y3": 354.163, "coord_origin": "TOPLEFT"}, "text": "1) a sequence of tokens that represent the structure of", "orig": "1) a sequence of tokens that represent the structure of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 130, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 374.67, "r_x1": 545.115, "r_y1": 374.67, "r_x2": 545.115, "r_y2": 366.118, "r_x3": 308.862, "r_y3": 366.118, "coord_origin": "TOPLEFT"}, "text": "a table, and 2) a bounding box coupled to a subset of those", "orig": "a table, and 2) a bounding box coupled to a subset of those", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 131, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 386.625, "r_x1": 337.265, "r_y1": 386.625, "r_x2": 337.265, "r_y2": 378.073, "r_x3": 308.862, "r_y3": 378.073, "coord_origin": "TOPLEFT"}, "text": "tokens.", "orig": "tokens.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 132, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 341.808, "r_y0": 386.625, "r_x1": 545.115, "r_y1": 386.625, "r_x2": 545.115, "r_y2": 378.073, "r_x3": 341.808, "r_y3": 378.073, "coord_origin": "TOPLEFT"}, "text": "The conversion of an image into a sequence of to-", "orig": "The conversion of an image into a sequence of to-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 133, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 398.58, "r_x1": 545.115, "r_y1": 398.58, "r_x2": 545.115, "r_y2": 390.028, "r_x3": 308.862, "r_y3": 390.028, "coord_origin": "TOPLEFT"}, "text": "kens is a well-known task [35, 16]. While attention is often", "orig": "kens is a well-known task [35, 16]. While attention is often", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 134, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 410.535, "r_x1": 545.115, "r_y1": 410.535, "r_x2": 545.115, "r_y2": 401.983, "r_x3": 308.862, "r_y3": 401.983, "coord_origin": "TOPLEFT"}, "text": "used as an implicit method to associate each token of the", "orig": "used as an implicit method to associate each token of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 135, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 422.491, "r_x1": 545.115, "r_y1": 422.491, "r_x2": 545.115, "r_y2": 413.939, "r_x3": 308.862, "r_y3": 413.939, "coord_origin": "TOPLEFT"}, "text": "sequence with a position in the original image, an explicit", "orig": "sequence with a position in the original image, an explicit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 136, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 434.446, "r_x1": 545.115, "r_y1": 434.446, "r_x2": 545.115, "r_y2": 425.894, "r_x3": 308.862, "r_y3": 425.894, "coord_origin": "TOPLEFT"}, "text": "association between the individual table-cells and the image", "orig": "association between the individual table-cells and the image", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 137, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 446.401, "r_x1": 437.937, "r_y1": 446.401, "r_x2": 437.937, "r_y2": 437.849, "r_x3": 308.862, "r_y3": 437.849, "coord_origin": "TOPLEFT"}, "text": "bounding boxes is also required.", "orig": "bounding boxes is also required.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 138, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 467.546, "r_x1": 420.161, "r_y1": 467.546, "r_x2": 420.161, "r_y2": 457.694, "r_x3": 308.862, "r_y3": 457.694, "coord_origin": "TOPLEFT"}, "text": "4.1. Model architecture.", "orig": "4.1. Model architecture.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 139, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 485.586, "r_x1": 545.115, "r_y1": 485.586, "r_x2": 545.115, "r_y2": 477.034, "r_x3": 320.817, "r_y3": 477.034, "coord_origin": "TOPLEFT"}, "text": "We now describe in detail the proposed method, which", "orig": "We now describe in detail the proposed method, which", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 140, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 497.541, "r_x1": 315.507, "r_y1": 497.541, "r_x2": 315.507, "r_y2": 488.989, "r_x3": 308.862, "r_y3": 488.989, "coord_origin": "TOPLEFT"}, "text": "is", "orig": "is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 141, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 319.153, "r_y0": 497.541, "r_x1": 509.021, "r_y1": 497.541, "r_x2": 509.021, "r_y2": 488.989, "r_x3": 319.153, "r_y3": 488.989, "coord_origin": "TOPLEFT"}, "text": "composed of three main components, see Fig.", "orig": "composed of three main components, see Fig.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 142, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 515.586, "r_y0": 497.541, "r_x1": 523.058, "r_y1": 497.541, "r_x2": 523.058, "r_y2": 488.989, "r_x3": 515.586, "r_y3": 488.989, "coord_origin": "TOPLEFT"}, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 143, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 529.623, "r_y0": 497.541, "r_x1": 545.115, "r_y1": 497.541, "r_x2": 545.115, "r_y2": 488.989, "r_x3": 529.623, "r_y3": 488.989, "coord_origin": "TOPLEFT"}, "text": "Our", "orig": "Our", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 144, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 509.353, "r_x1": 406.346, "r_y1": 509.353, "r_x2": 406.346, "r_y2": 500.765, "r_x3": 308.862, "r_y3": 500.765, "coord_origin": "TOPLEFT"}, "text": "CNN Backbone Network", "orig": "CNN Backbone Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 145, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 408.872, "r_y0": 509.496, "r_x1": 545.111, "r_y1": 509.496, "r_x2": 545.111, "r_y2": 500.944, "r_x3": 408.872, "r_y3": 500.944, "coord_origin": "TOPLEFT"}, "text": "encodes the input as a feature vec-", "orig": "encodes the input as a feature vec-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 146, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 521.452, "r_x1": 319.93, "r_y1": 521.452, "r_x2": 319.93, "r_y2": 512.9, "r_x3": 308.862, "r_y3": 512.9, "coord_origin": "TOPLEFT"}, "text": "tor", "orig": "tor", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 147, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 323.836, "r_y0": 521.452, "r_x1": 409.395, "r_y1": 521.452, "r_x2": 409.395, "r_y2": 512.9, "r_x3": 323.836, "r_y3": 512.9, "coord_origin": "TOPLEFT"}, "text": "of predefined length.", "orig": "of predefined length.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 148, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 416.727, "r_y0": 521.452, "r_x1": 545.115, "r_y1": 521.452, "r_x2": 545.115, "r_y2": 512.9, "r_x3": 416.727, "r_y3": 512.9, "coord_origin": "TOPLEFT"}, "text": "The input feature vector of the", "orig": "The input feature vector of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 149, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 533.4069999999999, "r_x1": 436.194, "r_y1": 533.4069999999999, "r_x2": 436.194, "r_y2": 524.855, "r_x3": 308.862, "r_y3": 524.855, "coord_origin": "TOPLEFT"}, "text": "encoded image is passed to the", "orig": "encoded image is passed to the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 150, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 439.526, "r_y0": 533.264, "r_x1": 513.867, "r_y1": 533.264, "r_x2": 513.867, "r_y2": 524.6759999999999, "r_x3": 439.526, "r_y3": 524.6759999999999, "coord_origin": "TOPLEFT"}, "text": "Structure Decoder", "orig": "Structure Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 151, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 517.432, "r_y0": 533.4069999999999, "r_x1": 545.108, "r_y1": 533.4069999999999, "r_x2": 545.108, "r_y2": 524.855, "r_x3": 517.432, "r_y3": 524.855, "coord_origin": "TOPLEFT"}, "text": "to pro-", "orig": "to pro-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 152, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 545.362, "r_x1": 545.115, "r_y1": 545.362, "r_x2": 545.115, "r_y2": 536.81, "r_x3": 308.862, "r_y3": 536.81, "coord_origin": "TOPLEFT"}, "text": "duce a sequence of HTML tags that represent the structure", "orig": "duce a sequence of HTML tags that represent the structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 153, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 557.317, "r_x1": 358.545, "r_y1": 557.317, "r_x2": 358.545, "r_y2": 548.765, "r_x3": 308.862, "r_y3": 548.765, "coord_origin": "TOPLEFT"}, "text": "of the table.", "orig": "of the table.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 154, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 365.191, "r_y0": 557.317, "r_x1": 545.115, "r_y1": 557.317, "r_x2": 545.115, "r_y2": 548.765, "r_x3": 365.191, "r_y3": 548.765, "coord_origin": "TOPLEFT"}, "text": "With each prediction of an HTML standard", "orig": "With each prediction of an HTML standard", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 155, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 569.2719999999999, "r_x1": 352.409, "r_y1": 569.2719999999999, "r_x2": 352.409, "r_y2": 560.72, "r_x3": 308.862, "r_y3": 560.72, "coord_origin": "TOPLEFT"}, "text": "data cell ('", "orig": "data cell ('", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 156, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 352.409, "r_y0": 569.108, "r_x1": 360.158, "r_y1": 569.108, "r_x2": 360.158, "r_y2": 560.402, "r_x3": 352.409, "r_y3": 560.402, "coord_origin": "TOPLEFT"}, "text": "<", "orig": "<", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 157, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 360.158, "r_y0": 569.2719999999999, "r_x1": 367.909, "r_y1": 569.2719999999999, "r_x2": 367.909, "r_y2": 560.72, "r_x3": 360.158, "r_y3": 560.72, "coord_origin": "TOPLEFT"}, "text": "td", "orig": "td", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 158, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 367.909, "r_y0": 569.108, "r_x1": 375.658, "r_y1": 569.108, "r_x2": 375.658, "r_y2": 560.402, "r_x3": 367.909, "r_y3": 560.402, "coord_origin": "TOPLEFT"}, "text": ">", "orig": ">", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 159, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 375.658, "r_y0": 569.2719999999999, "r_x1": 545.112, "r_y1": 569.2719999999999, "r_x2": 545.112, "r_y2": 560.72, "r_x3": 375.658, "r_y3": 560.72, "coord_origin": "TOPLEFT"}, "text": "') the hidden state of that cell is passed to", "orig": "') the hidden state of that cell is passed to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 160, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 581.2280000000001, "r_x1": 545.115, "r_y1": 581.2280000000001, "r_x2": 545.115, "r_y2": 572.6759999999999, "r_x3": 308.862, "r_y3": 572.6759999999999, "coord_origin": "TOPLEFT"}, "text": "the Cell BBox Decoder. As for spanning cells, such as row", "orig": "the Cell BBox Decoder. As for spanning cells, such as row", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 161, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 593.183, "r_x1": 483.118, "r_y1": 593.183, "r_x2": 483.118, "r_y2": 584.631, "r_x3": 308.862, "r_y3": 584.631, "coord_origin": "TOPLEFT"}, "text": "or column span, the tag is broken down to '", "orig": "or column span, the tag is broken down to '", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 162, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 483.119, "r_y0": 593.019, "r_x1": 490.868, "r_y1": 593.019, "r_x2": 490.868, "r_y2": 584.313, "r_x3": 483.119, "r_y3": 584.313, "coord_origin": "TOPLEFT"}, "text": "<", "orig": "<", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 163, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 490.868, "r_y0": 593.183, "r_x1": 545.114, "r_y1": 593.183, "r_x2": 545.114, "r_y2": 584.631, "r_x3": 490.868, "r_y3": 584.631, "coord_origin": "TOPLEFT"}, "text": "', 'rowspan='", "orig": "', 'rowspan='", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 164, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 605.138, "r_x1": 545.115, "r_y1": 605.138, "r_x2": 545.115, "r_y2": 596.586, "r_x3": 308.862, "r_y3": 596.586, "coord_origin": "TOPLEFT"}, "text": "or 'colspan=', with the number of spanning cells (attribute),", "orig": "or 'colspan=', with the number of spanning cells (attribute),", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 165, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 617.093, "r_x1": 329.644, "r_y1": 617.093, "r_x2": 329.644, "r_y2": 608.5409999999999, "r_x3": 308.862, "r_y3": 608.5409999999999, "coord_origin": "TOPLEFT"}, "text": "and '", "orig": "and '", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 166, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 329.646, "r_y0": 616.929, "r_x1": 337.395, "r_y1": 616.929, "r_x2": 337.395, "r_y2": 608.223, "r_x3": 329.646, "r_y3": 608.223, "coord_origin": "TOPLEFT"}, "text": ">", "orig": ">", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 167, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 337.394, "r_y0": 617.093, "r_x1": 343.202, "r_y1": 617.093, "r_x2": 343.202, "r_y2": 608.5409999999999, "r_x3": 337.394, "r_y3": 608.5409999999999, "coord_origin": "TOPLEFT"}, "text": "'.", "orig": "'.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 168, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 348.064, "r_y0": 617.093, "r_x1": 468.591, "r_y1": 617.093, "r_x2": 468.591, "r_y2": 608.5409999999999, "r_x3": 348.064, "r_y3": 608.5409999999999, "coord_origin": "TOPLEFT"}, "text": "The hidden state attached to '", "orig": "The hidden state attached to '", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 169, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 468.595, "r_y0": 616.929, "r_x1": 476.344, "r_y1": 616.929, "r_x2": 476.344, "r_y2": 608.223, "r_x3": 468.595, "r_y3": 608.223, "coord_origin": "TOPLEFT"}, "text": "<", "orig": "<", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 170, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 476.344, "r_y0": 617.093, "r_x1": 545.116, "r_y1": 617.093, "r_x2": 545.116, "r_y2": 608.5409999999999, "r_x3": 476.344, "r_y3": 608.5409999999999, "coord_origin": "TOPLEFT"}, "text": "' is passed to the", "orig": "' is passed to the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 171, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 629.048, "r_x1": 545.115, "r_y1": 629.048, "r_x2": 545.115, "r_y2": 620.496, "r_x3": 308.862, "r_y3": 620.496, "coord_origin": "TOPLEFT"}, "text": "Cell BBox Decoder. A shared feed forward network (FFN)", "orig": "Cell BBox Decoder. A shared feed forward network (FFN)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 172, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 641.0029999999999, "r_x1": 533.2, "r_y1": 641.0029999999999, "r_x2": 533.2, "r_y2": 632.451, "r_x3": 308.862, "r_y3": 632.451, "coord_origin": "TOPLEFT"}, "text": "receives the hidden states from the Structure Decoder,", "orig": "receives the hidden states from the Structure Decoder,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 173, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 537.364, "r_y0": 641.0029999999999, "r_x1": 545.115, "r_y1": 641.0029999999999, "r_x2": 545.115, "r_y2": 632.451, "r_x3": 537.364, "r_y3": 632.451, "coord_origin": "TOPLEFT"}, "text": "to", "orig": "to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 174, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 652.9590000000001, "r_x1": 545.115, "r_y1": 652.9590000000001, "r_x2": 545.115, "r_y2": 644.407, "r_x3": 308.862, "r_y3": 644.407, "coord_origin": "TOPLEFT"}, "text": "provide the final detection predictions of the bounding box", "orig": "provide the final detection predictions of the bounding box", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 175, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 664.914, "r_x1": 449.424, "r_y1": 664.914, "r_x2": 449.424, "r_y2": 656.362, "r_x3": 308.862, "r_y3": 656.362, "coord_origin": "TOPLEFT"}, "text": "coordinates and their classification.", "orig": "coordinates and their classification.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 176, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 677.217, "r_x1": 431.91, "r_y1": 677.217, "r_x2": 431.91, "r_y2": 668.261, "r_x3": 320.817, "r_y3": 668.261, "coord_origin": "TOPLEFT"}, "text": "CNN Backbone Network.", "orig": "CNN Backbone Network.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 177, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 439.499, "r_y0": 677.201, "r_x1": 545.113, "r_y1": 677.201, "r_x2": 545.113, "r_y2": 668.649, "r_x3": 439.499, "r_y3": 668.649, "coord_origin": "TOPLEFT"}, "text": "A ResNet-18 CNN is the", "orig": "A ResNet-18 CNN is the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 178, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 689.156, "r_x1": 545.115, "r_y1": 689.156, "r_x2": 545.115, "r_y2": 680.604, "r_x3": 308.862, "r_y3": 680.604, "coord_origin": "TOPLEFT"}, "text": "backbone that receives the table image and encodes it as a", "orig": "backbone that receives the table image and encodes it as a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 179, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 701.111, "r_x1": 545.115, "r_y1": 701.111, "r_x2": 545.115, "r_y2": 692.559, "r_x3": 308.862, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "vector of predefined length. The network has been modified", "orig": "vector of predefined length. The network has been modified", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 180, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 713.066, "r_x1": 545.115, "r_y1": 713.066, "r_x2": 545.115, "r_y2": 704.514, "r_x3": 308.862, "r_y3": 704.514, "coord_origin": "TOPLEFT"}, "text": "by removing the linear and pooling layer, as we are not per-", "orig": "by removing the linear and pooling layer, as we are not per-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 181, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 295.121, "r_y0": 742.954, "r_x1": 300.102, "r_y1": 742.954, "r_x2": 300.102, "r_y2": 734.402, "r_x3": 295.121, "r_y3": 734.402, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "parsed_page": null, "predictions": {"layout": {"clusters": [{"id": 10, "label": "text", "bbox": {"l": 50.112, "t": 75.47699999999998, "r": 286.365, "b": 95.98400000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.9611433148384094, "cells": [{"index": 0, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 84.029, "r_x1": 286.365, "r_y1": 84.029, "r_x2": 286.365, "r_y2": 75.47699999999998, "r_x3": 50.112, "r_y3": 75.47699999999998, "coord_origin": "TOPLEFT"}, "text": "amount of such tables, and kept only those ones ranging", "orig": "amount of such tables, and kept only those ones ranging", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 95.98400000000004, "r_x1": 212.283, "r_y1": 95.98400000000004, "r_x2": 212.283, "r_y2": 87.43200000000002, "r_x3": 50.112, "r_y3": 87.43200000000002, "coord_origin": "TOPLEFT"}, "text": "between 1*1 and 20*10 (rows/columns).", "orig": "between 1*1 and 20*10 (rows/columns).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 1, "label": "text", "bbox": {"l": 50.112, "t": 101.22900000000004, "r": 286.365, "b": 313.019, "coord_origin": "TOPLEFT"}, "confidence": 0.988013744354248, "cells": [{"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 109.78099999999995, "r_x1": 286.365, "r_y1": 109.78099999999995, "r_x2": 286.365, "r_y2": 101.22900000000004, "r_x3": 62.067, "r_y3": 101.22900000000004, "coord_origin": "TOPLEFT"}, "text": "The availability of the bounding boxes for all table cells", "orig": "The availability of the bounding boxes for all table cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 121.73599999999999, "r_x1": 176.458, "r_y1": 121.73599999999999, "r_x2": 176.458, "r_y2": 113.18399999999997, "r_x3": 50.112, "r_y3": 113.18399999999997, "coord_origin": "TOPLEFT"}, "text": "is essential to train our models.", "orig": "is essential to train our models.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 180.971, "r_y0": 121.73599999999999, "r_x1": 286.365, "r_y1": 121.73599999999999, "r_x2": 286.365, "r_y2": 113.18399999999997, "r_x3": 180.971, "r_y3": 113.18399999999997, "coord_origin": "TOPLEFT"}, "text": "In order to distinguish be-", "orig": "In order to distinguish be-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 133.69100000000003, "r_x1": 286.365, "r_y1": 133.69100000000003, "r_x2": 286.365, "r_y2": 125.13900000000001, "r_x3": 50.112, "r_y3": 125.13900000000001, "coord_origin": "TOPLEFT"}, "text": "tween empty and non-empty bounding boxes, we have in-", "orig": "tween empty and non-empty bounding boxes, we have in-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 145.64700000000005, "r_x1": 286.365, "r_y1": 145.64700000000005, "r_x2": 286.365, "r_y2": 137.09500000000003, "r_x3": 50.112, "r_y3": 137.09500000000003, "coord_origin": "TOPLEFT"}, "text": "troduced a binary class in the annotation. Unfortunately, the", "orig": "troduced a binary class in the annotation. Unfortunately, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 157.60199999999998, "r_x1": 286.365, "r_y1": 157.60199999999998, "r_x2": 286.365, "r_y2": 149.04999999999995, "r_x3": 50.112, "r_y3": 149.04999999999995, "coord_origin": "TOPLEFT"}, "text": "original datasets either omit the bounding boxes for whole", "orig": "original datasets either omit the bounding boxes for whole", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 169.55700000000002, "r_x1": 94.127, "r_y1": 169.55700000000002, "r_x2": 94.127, "r_y2": 161.005, "r_x3": 50.112, "r_y3": 161.005, "coord_origin": "TOPLEFT"}, "text": "tables (e.g.", "orig": "tables (e.g.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 98.959, "r_y0": 169.55700000000002, "r_x1": 286.365, "r_y1": 169.55700000000002, "r_x2": 286.365, "r_y2": 161.005, "r_x3": 98.959, "r_y3": 161.005, "coord_origin": "TOPLEFT"}, "text": "TableBank) or they narrow their scope only to", "orig": "TableBank) or they narrow their scope only to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 181.51199999999994, "r_x1": 116.951, "r_y1": 181.51199999999994, "r_x2": 116.951, "r_y2": 172.96000000000004, "r_x3": 50.112, "r_y3": 172.96000000000004, "coord_origin": "TOPLEFT"}, "text": "non-empty cells.", "orig": "non-empty cells.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 121.345, "r_y0": 181.51199999999994, "r_x1": 286.365, "r_y1": 181.51199999999994, "r_x2": 286.365, "r_y2": 172.96000000000004, "r_x3": 121.345, "r_y3": 172.96000000000004, "coord_origin": "TOPLEFT"}, "text": "Therefore, it was imperative to introduce", "orig": "Therefore, it was imperative to introduce", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 193.46699999999998, "r_x1": 286.365, "r_y1": 193.46699999999998, "r_x2": 286.365, "r_y2": 184.91499999999996, "r_x3": 50.112, "r_y3": 184.91499999999996, "coord_origin": "TOPLEFT"}, "text": "a data pre-processing procedure that generates the missing", "orig": "a data pre-processing procedure that generates the missing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 205.423, "r_x1": 286.365, "r_y1": 205.423, "r_x2": 286.365, "r_y2": 196.87099999999998, "r_x3": 50.112, "r_y3": 196.87099999999998, "coord_origin": "TOPLEFT"}, "text": "bounding boxes out of the annotation information. This pro-", "orig": "bounding boxes out of the annotation information. This pro-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 217.37800000000004, "r_x1": 286.365, "r_y1": 217.37800000000004, "r_x2": 286.365, "r_y2": 208.82600000000002, "r_x3": 50.112, "r_y3": 208.82600000000002, "coord_origin": "TOPLEFT"}, "text": "cedure first parses the provided table structure and calcu-", "orig": "cedure first parses the provided table structure and calcu-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 229.33299999999997, "r_x1": 286.365, "r_y1": 229.33299999999997, "r_x2": 286.365, "r_y2": 220.78099999999995, "r_x3": 50.112, "r_y3": 220.78099999999995, "coord_origin": "TOPLEFT"}, "text": "lates the dimensions of the most fine-grained grid that cov-", "orig": "lates the dimensions of the most fine-grained grid that cov-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 241.288, "r_x1": 139.805, "r_y1": 241.288, "r_x2": 139.805, "r_y2": 232.736, "r_x3": 50.112, "r_y3": 232.736, "coord_origin": "TOPLEFT"}, "text": "ers the table structure.", "orig": "ers the table structure.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 144.607, "r_y0": 241.288, "r_x1": 286.365, "r_y1": 241.288, "r_x2": 286.365, "r_y2": 232.736, "r_x3": 144.607, "r_y3": 232.736, "coord_origin": "TOPLEFT"}, "text": "Notice that each table cell may oc-", "orig": "Notice that each table cell may oc-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 253.24300000000005, "r_x1": 286.365, "r_y1": 253.24300000000005, "r_x2": 286.365, "r_y2": 244.69100000000003, "r_x3": 50.112, "r_y3": 244.69100000000003, "coord_origin": "TOPLEFT"}, "text": "cupy multiple grid squares due to row or column spans. In", "orig": "cupy multiple grid squares due to row or column spans. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 19, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 265.198, "r_x1": 286.365, "r_y1": 265.198, "r_x2": 286.365, "r_y2": 256.64599999999996, "r_x3": 50.112, "r_y3": 256.64599999999996, "coord_origin": "TOPLEFT"}, "text": "case of PubTabNet we had to compute missing bounding", "orig": "case of PubTabNet we had to compute missing bounding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 20, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 277.154, "r_x1": 286.365, "r_y1": 277.154, "r_x2": 286.365, "r_y2": 268.602, "r_x3": 50.112, "r_y3": 268.602, "coord_origin": "TOPLEFT"}, "text": "boxes for 48% of the simple and 69% of the complex ta-", "orig": "boxes for 48% of the simple and 69% of the complex ta-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 21, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 289.109, "r_x1": 68.652, "r_y1": 289.109, "r_x2": 68.652, "r_y2": 280.557, "r_x3": 50.112, "r_y3": 280.557, "coord_origin": "TOPLEFT"}, "text": "bles.", "orig": "bles.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 22, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 75.566, "r_y0": 289.109, "r_x1": 286.365, "r_y1": 289.109, "r_x2": 286.365, "r_y2": 280.557, "r_x3": 75.566, "r_y3": 280.557, "coord_origin": "TOPLEFT"}, "text": "Regarding FinTabNet, 68% of the simple and 98%", "orig": "Regarding FinTabNet, 68% of the simple and 98%", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 23, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 301.064, "r_x1": 286.365, "r_y1": 301.064, "r_x2": 286.365, "r_y2": 292.512, "r_x3": 50.112, "r_y3": 292.512, "coord_origin": "TOPLEFT"}, "text": "of the complex tables require the generation of bounding", "orig": "of the complex tables require the generation of bounding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 24, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 313.019, "r_x1": 75.696, "r_y1": 313.019, "r_x2": 75.696, "r_y2": 304.467, "r_x3": 50.112, "r_y3": 304.467, "coord_origin": "TOPLEFT"}, "text": "boxes.", "orig": "boxes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 4, "label": "text", "bbox": {"l": 50.112, "t": 318.264, "r": 286.365, "b": 434.413, "coord_origin": "TOPLEFT"}, "confidence": 0.9873981475830078, "cells": [{"index": 25, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 326.816, "r_x1": 286.365, "r_y1": 326.816, "r_x2": 286.365, "r_y2": 318.264, "r_x3": 62.067, "r_y3": 318.264, "coord_origin": "TOPLEFT"}, "text": "As it is illustrated in Fig. 2, the table distributions from", "orig": "As it is illustrated in Fig. 2, the table distributions from", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 26, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 338.772, "r_x1": 60.075, "r_y1": 338.772, "r_x2": 60.075, "r_y2": 330.22, "r_x3": 50.112, "r_y3": 330.22, "coord_origin": "TOPLEFT"}, "text": "all", "orig": "all", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 27, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 65.146, "r_y0": 338.772, "r_x1": 96.687, "r_y1": 338.772, "r_x2": 96.687, "r_y2": 330.22, "r_x3": 65.146, "r_y3": 330.22, "coord_origin": "TOPLEFT"}, "text": "datasets", "orig": "datasets", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 28, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 101.768, "r_y0": 338.772, "r_x1": 113.932, "r_y1": 338.772, "r_x2": 113.932, "r_y2": 330.22, "r_x3": 101.768, "r_y3": 330.22, "coord_origin": "TOPLEFT"}, "text": "are", "orig": "are", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 29, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 119.003, "r_y0": 338.772, "r_x1": 148.533, "r_y1": 338.772, "r_x2": 148.533, "r_y2": 330.22, "r_x3": 119.003, "r_y3": 330.22, "coord_origin": "TOPLEFT"}, "text": "skewed", "orig": "skewed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 30, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 153.613, "r_y0": 338.772, "r_x1": 184.806, "r_y1": 338.772, "r_x2": 184.806, "r_y2": 330.22, "r_x3": 153.613, "r_y3": 330.22, "coord_origin": "TOPLEFT"}, "text": "towards", "orig": "towards", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 189.877, "r_y0": 338.772, "r_x1": 219.765, "r_y1": 338.772, "r_x2": 219.765, "r_y2": 330.22, "r_x3": 189.877, "r_y3": 330.22, "coord_origin": "TOPLEFT"}, "text": "simpler", "orig": "simpler", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 224.836, "r_y0": 338.772, "r_x1": 263.571, "r_y1": 338.772, "r_x2": 263.571, "r_y2": 330.22, "r_x3": 224.836, "r_y3": 330.22, "coord_origin": "TOPLEFT"}, "text": "structures", "orig": "structures", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 268.652, "r_y0": 338.772, "r_x1": 286.365, "r_y1": 338.772, "r_x2": 286.365, "r_y2": 330.22, "r_x3": 268.652, "r_y3": 330.22, "coord_origin": "TOPLEFT"}, "text": "with", "orig": "with", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 350.727, "r_x1": 286.365, "r_y1": 350.727, "r_x2": 286.365, "r_y2": 342.175, "r_x3": 50.112, "r_y3": 342.175, "coord_origin": "TOPLEFT"}, "text": "fewer number of rows/columns. Additionally, there is very", "orig": "fewer number of rows/columns. Additionally, there is very", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 362.682, "r_x1": 286.365, "r_y1": 362.682, "r_x2": 286.365, "r_y2": 354.13, "r_x3": 50.112, "r_y3": 354.13, "coord_origin": "TOPLEFT"}, "text": "limited variance in the table styles, which in case of Pub-", "orig": "limited variance in the table styles, which in case of Pub-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 374.637, "r_x1": 286.365, "r_y1": 374.637, "r_x2": 286.365, "r_y2": 366.085, "r_x3": 50.112, "r_y3": 366.085, "coord_origin": "TOPLEFT"}, "text": "TabNet and FinTabNet means one styling format for the", "orig": "TabNet and FinTabNet means one styling format for the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 386.592, "r_x1": 141.589, "r_y1": 386.592, "r_x2": 141.589, "r_y2": 378.04, "r_x3": 50.112, "r_y3": 378.04, "coord_origin": "TOPLEFT"}, "text": "majority of the tables.", "orig": "majority of the tables.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 148.702, "r_y0": 386.592, "r_x1": 286.365, "r_y1": 386.592, "r_x2": 286.365, "r_y2": 378.04, "r_x3": 148.702, "r_y3": 378.04, "coord_origin": "TOPLEFT"}, "text": "Similar limitations appear also in", "orig": "Similar limitations appear also in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 398.547, "r_x1": 286.365, "r_y1": 398.547, "r_x2": 286.365, "r_y2": 389.995, "r_x3": 50.112, "r_y3": 389.995, "coord_origin": "TOPLEFT"}, "text": "the type of table content, which in some cases (e.g. FinTab-", "orig": "the type of table content, which in some cases (e.g. FinTab-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 410.503, "r_x1": 201.822, "r_y1": 410.503, "r_x2": 201.822, "r_y2": 401.951, "r_x3": 50.112, "r_y3": 401.951, "coord_origin": "TOPLEFT"}, "text": "Net) is restricted to a certain domain.", "orig": "Net) is restricted to a certain domain.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 206.764, "r_y0": 410.503, "r_x1": 286.365, "r_y1": 410.503, "r_x2": 286.365, "r_y2": 401.951, "r_x3": 206.764, "r_y3": 401.951, "coord_origin": "TOPLEFT"}, "text": "Ultimately, the lack", "orig": "Ultimately, the lack", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 422.458, "r_x1": 286.365, "r_y1": 422.458, "r_x2": 286.365, "r_y2": 413.906, "r_x3": 50.112, "r_y3": 413.906, "coord_origin": "TOPLEFT"}, "text": "of diversity in the training dataset damages the ability of the", "orig": "of diversity in the training dataset damages the ability of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 434.413, "r_x1": 216.398, "r_y1": 434.413, "r_x2": 216.398, "r_y2": 425.861, "r_x3": 50.112, "r_y3": 425.861, "coord_origin": "TOPLEFT"}, "text": "models to generalize well on unseen data.", "orig": "models to generalize well on unseen data.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 3, "label": "text", "bbox": {"l": 50.112, "t": 439.658, "r": 286.367, "b": 627.538, "coord_origin": "TOPLEFT"}, "confidence": 0.9876030087471008, "cells": [{"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 448.21, "r_x1": 286.365, "r_y1": 448.21, "r_x2": 286.365, "r_y2": 439.658, "r_x3": 62.067, "r_y3": 439.658, "coord_origin": "TOPLEFT"}, "text": "Motivated by those observations we aimed at generating", "orig": "Motivated by those observations we aimed at generating", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 460.165, "r_x1": 172.144, "r_y1": 460.165, "r_x2": 172.144, "r_y2": 451.613, "r_x3": 50.112, "r_y3": 451.613, "coord_origin": "TOPLEFT"}, "text": "a synthetic table dataset named", "orig": "a synthetic table dataset named", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 174.148, "r_y0": 460.022, "r_x1": 224.708, "r_y1": 460.022, "r_x2": 224.708, "r_y2": 451.434, "r_x3": 174.148, "r_y3": 451.434, "coord_origin": "TOPLEFT"}, "text": "SynthTabNet", "orig": "SynthTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 224.708, "r_y0": 460.165, "r_x1": 227.199, "r_y1": 460.165, "r_x2": 227.199, "r_y2": 451.613, "r_x3": 224.708, "r_y3": 451.613, "coord_origin": "TOPLEFT"}, "text": ".", "orig": ".", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 48, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 230.128, "r_y0": 460.165, "r_x1": 286.367, "r_y1": 460.165, "r_x2": 286.367, "r_y2": 451.613, "r_x3": 230.128, "r_y3": 451.613, "coord_origin": "TOPLEFT"}, "text": "This approach", "orig": "This approach", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 49, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 472.121, "r_x1": 128.179, "r_y1": 472.121, "r_x2": 128.179, "r_y2": 463.569, "r_x3": 50.112, "r_y3": 463.569, "coord_origin": "TOPLEFT"}, "text": "offers control over:", "orig": "offers control over:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 50, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 132.971, "r_y0": 472.121, "r_x1": 286.365, "r_y1": 472.121, "r_x2": 286.365, "r_y2": 463.569, "r_x3": 132.971, "r_y3": 463.569, "coord_origin": "TOPLEFT"}, "text": "1) the size of the dataset, 2) the table", "orig": "1) the size of the dataset, 2) the table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 51, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 484.076, "r_x1": 266.739, "r_y1": 484.076, "r_x2": 266.739, "r_y2": 475.524, "r_x3": 50.112, "r_y3": 475.524, "coord_origin": "TOPLEFT"}, "text": "structure, 3) the table style and 4) the type of content.", "orig": "structure, 3) the table style and 4) the type of content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 52, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 270.873, "r_y0": 484.076, "r_x1": 286.365, "r_y1": 484.076, "r_x2": 286.365, "r_y2": 475.524, "r_x3": 270.873, "r_y3": 475.524, "coord_origin": "TOPLEFT"}, "text": "The", "orig": "The", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 53, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 496.031, "r_x1": 286.365, "r_y1": 496.031, "r_x2": 286.365, "r_y2": 487.479, "r_x3": 50.112, "r_y3": 487.479, "coord_origin": "TOPLEFT"}, "text": "complexity of the table structure is described by the size of", "orig": "complexity of the table structure is described by the size of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 54, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 507.986, "r_x1": 286.365, "r_y1": 507.986, "r_x2": 286.365, "r_y2": 499.434, "r_x3": 50.112, "r_y3": 499.434, "coord_origin": "TOPLEFT"}, "text": "the table header and the table body, as well as the percentage", "orig": "the table header and the table body, as well as the percentage", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 55, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 519.941, "r_x1": 286.365, "r_y1": 519.941, "r_x2": 286.365, "r_y2": 511.389, "r_x3": 50.112, "r_y3": 511.389, "coord_origin": "TOPLEFT"}, "text": "of the table cells covered by row spans and column spans.", "orig": "of the table cells covered by row spans and column spans.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 56, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 531.8969999999999, "r_x1": 286.365, "r_y1": 531.8969999999999, "r_x2": 286.365, "r_y2": 523.345, "r_x3": 50.112, "r_y3": 523.345, "coord_origin": "TOPLEFT"}, "text": "A set of carefully designed styling templates provides the", "orig": "A set of carefully designed styling templates provides the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 57, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 543.852, "r_x1": 286.365, "r_y1": 543.852, "r_x2": 286.365, "r_y2": 535.3, "r_x3": 50.112, "r_y3": 535.3, "coord_origin": "TOPLEFT"}, "text": "basis to build a wide range of table appearances. Lastly, the", "orig": "basis to build a wide range of table appearances. Lastly, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 58, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 555.807, "r_x1": 286.365, "r_y1": 555.807, "r_x2": 286.365, "r_y2": 547.255, "r_x3": 50.112, "r_y3": 547.255, "coord_origin": "TOPLEFT"}, "text": "table content is generated out of a curated collection of text", "orig": "table content is generated out of a curated collection of text", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 59, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 567.762, "r_x1": 83.028, "r_y1": 567.762, "r_x2": 83.028, "r_y2": 559.21, "r_x3": 50.112, "r_y3": 559.21, "coord_origin": "TOPLEFT"}, "text": "corpora.", "orig": "corpora.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 60, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 87.153, "r_y0": 567.762, "r_x1": 286.365, "r_y1": 567.762, "r_x2": 286.365, "r_y2": 559.21, "r_x3": 87.153, "r_y3": 559.21, "coord_origin": "TOPLEFT"}, "text": "By controlling the size and scope of the synthetic", "orig": "By controlling the size and scope of the synthetic", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 61, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 579.717, "r_x1": 286.365, "r_y1": 579.717, "r_x2": 286.365, "r_y2": 571.165, "r_x3": 50.112, "r_y3": 571.165, "coord_origin": "TOPLEFT"}, "text": "datasets we are able to train and evaluate our models in a", "orig": "datasets we are able to train and evaluate our models in a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 62, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 591.672, "r_x1": 174.645, "r_y1": 591.672, "r_x2": 174.645, "r_y2": 583.12, "r_x3": 50.112, "r_y3": 583.12, "coord_origin": "TOPLEFT"}, "text": "variety of different conditions.", "orig": "variety of different conditions.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 63, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 181.021, "r_y0": 591.672, "r_x1": 286.365, "r_y1": 591.672, "r_x2": 286.365, "r_y2": 583.12, "r_x3": 181.021, "r_y3": 583.12, "coord_origin": "TOPLEFT"}, "text": "For example, we can first", "orig": "For example, we can first", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 64, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 603.6279999999999, "r_x1": 286.365, "r_y1": 603.6279999999999, "r_x2": 286.365, "r_y2": 595.076, "r_x3": 50.112, "r_y3": 595.076, "coord_origin": "TOPLEFT"}, "text": "generate a highly diverse dataset to train our models and", "orig": "generate a highly diverse dataset to train our models and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 65, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 615.583, "r_x1": 286.365, "r_y1": 615.583, "r_x2": 286.365, "r_y2": 607.031, "r_x3": 50.112, "r_y3": 607.031, "coord_origin": "TOPLEFT"}, "text": "then evaluate their performance on other synthetic datasets", "orig": "then evaluate their performance on other synthetic datasets", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 66, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 627.538, "r_x1": 209.753, "r_y1": 627.538, "r_x2": 209.753, "r_y2": 618.986, "r_x3": 50.112, "r_y3": 618.986, "coord_origin": "TOPLEFT"}, "text": "which are focused on a specific domain.", "orig": "which are focused on a specific domain.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 5, "label": "text", "bbox": {"l": 50.112, "t": 632.783, "r": 286.365, "b": 713.066, "coord_origin": "TOPLEFT"}, "confidence": 0.9871614575386047, "cells": [{"index": 67, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 641.335, "r_x1": 286.365, "r_y1": 641.335, "r_x2": 286.365, "r_y2": 632.783, "r_x3": 62.067, "r_y3": 632.783, "coord_origin": "TOPLEFT"}, "text": "In this regard, we have prepared four synthetic datasets,", "orig": "In this regard, we have prepared four synthetic datasets,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 68, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 653.29, "r_x1": 286.365, "r_y1": 653.29, "r_x2": 286.365, "r_y2": 644.738, "r_x3": 50.112, "r_y3": 644.738, "coord_origin": "TOPLEFT"}, "text": "each one containing 150k examples. The corpora to gener-", "orig": "each one containing 150k examples. The corpora to gener-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 69, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 665.246, "r_x1": 286.365, "r_y1": 665.246, "r_x2": 286.365, "r_y2": 656.694, "r_x3": 50.112, "r_y3": 656.694, "coord_origin": "TOPLEFT"}, "text": "ate the table text consists of the most frequent terms appear-", "orig": "ate the table text consists of the most frequent terms appear-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 70, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 677.201, "r_x1": 286.365, "r_y1": 677.201, "r_x2": 286.365, "r_y2": 668.649, "r_x3": 50.112, "r_y3": 668.649, "coord_origin": "TOPLEFT"}, "text": "ing in PubTabNet and FinTabNet together with randomly", "orig": "ing in PubTabNet and FinTabNet together with randomly", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 71, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 689.156, "r_x1": 109.519, "r_y1": 689.156, "r_x2": 109.519, "r_y2": 680.604, "r_x3": 50.112, "r_y3": 680.604, "coord_origin": "TOPLEFT"}, "text": "generated text.", "orig": "generated text.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 72, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 115.337, "r_y0": 689.156, "r_x1": 286.365, "r_y1": 689.156, "r_x2": 286.365, "r_y2": 680.604, "r_x3": 115.337, "r_y3": 680.604, "coord_origin": "TOPLEFT"}, "text": "The first two synthetic datasets have been", "orig": "The first two synthetic datasets have been", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 73, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 701.111, "r_x1": 286.365, "r_y1": 701.111, "r_x2": 286.365, "r_y2": 692.559, "r_x3": 50.112, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "fine-tuned to mimic the appearance of the original datasets", "orig": "fine-tuned to mimic the appearance of the original datasets", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 74, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 713.066, "r_x1": 286.365, "r_y1": 713.066, "r_x2": 286.365, "r_y2": 704.514, "r_x3": 50.112, "r_y3": 704.514, "coord_origin": "TOPLEFT"}, "text": "but encompass more complicated table structures. The third", "orig": "but encompass more complicated table structures. The third", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 8, "label": "table", "bbox": {"l": 310.67584228515625, "t": 73.19388580322266, "r": 542.9547119140625, "b": 155.22052001953125, "coord_origin": "TOPLEFT"}, "confidence": 0.9777463674545288, "cells": [{"index": 75, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 412.332, "r_y0": 82.43499999999995, "r_x1": 430.902, "r_y1": 82.43499999999995, "r_x2": 430.902, "r_y2": 73.88300000000004, "r_x3": 412.332, "r_y3": 73.88300000000004, "coord_origin": "TOPLEFT"}, "text": "Tags", "orig": "Tags", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 76, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 442.857, "r_y0": 82.43499999999995, "r_x1": 464.446, "r_y1": 82.43499999999995, "r_x2": 464.446, "r_y2": 73.88300000000004, "r_x3": 442.857, "r_y3": 73.88300000000004, "coord_origin": "TOPLEFT"}, "text": "Bbox", "orig": "Bbox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 77, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 477.786, "r_y0": 82.43499999999995, "r_x1": 494.942, "r_y1": 82.43499999999995, "r_x2": 494.942, "r_y2": 73.88300000000004, "r_x3": 477.786, "r_y3": 73.88300000000004, "coord_origin": "TOPLEFT"}, "text": "Size", "orig": "Size", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 78, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 508.282, "r_y0": 82.43499999999995, "r_x1": 536.914, "r_y1": 82.43499999999995, "r_x2": 536.914, "r_y2": 73.88300000000004, "r_x3": 508.282, "r_y3": 73.88300000000004, "coord_origin": "TOPLEFT"}, "text": "Format", "orig": "Format", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 79, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 317.06, "r_y0": 94.78800000000001, "r_x1": 361.643, "r_y1": 94.78800000000001, "r_x2": 361.643, "r_y2": 86.23599999999999, "r_x3": 317.06, "r_y3": 86.23599999999999, "coord_origin": "TOPLEFT"}, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 80, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 417.856, "r_y0": 92.72199999999998, "r_x1": 425.378, "r_y1": 92.72199999999998, "r_x2": 425.378, "r_y2": 85.668, "r_x3": 417.856, "r_y3": 85.668, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 81, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 449.896, "r_y0": 92.72199999999998, "r_x1": 457.417, "r_y1": 92.72199999999998, "r_x2": 457.417, "r_y2": 85.668, "r_x3": 449.896, "r_y3": 85.668, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 82, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 476.401, "r_y0": 94.78800000000001, "r_x1": 496.326, "r_y1": 94.78800000000001, "r_x2": 496.326, "r_y2": 86.23599999999999, "r_x3": 476.401, "r_y3": 86.23599999999999, "coord_origin": "TOPLEFT"}, "text": "509k", "orig": "509k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 83, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 512.635, "r_y0": 94.78800000000001, "r_x1": 532.56, "r_y1": 94.78800000000001, "r_x2": 532.56, "r_y2": 86.23599999999999, "r_x3": 512.635, "r_y3": 86.23599999999999, "coord_origin": "TOPLEFT"}, "text": "PNG", "orig": "PNG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 84, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 317.06, "r_y0": 106.74300000000005, "r_x1": 359.431, "r_y1": 106.74300000000005, "r_x2": 359.431, "r_y2": 98.19100000000003, "r_x3": 317.06, "r_y3": 98.19100000000003, "coord_origin": "TOPLEFT"}, "text": "FinTabNet", "orig": "FinTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 85, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 417.856, "r_y0": 104.67700000000002, "r_x1": 425.378, "r_y1": 104.67700000000002, "r_x2": 425.378, "r_y2": 97.62300000000005, "r_x3": 417.856, "r_y3": 97.62300000000005, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 86, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 449.896, "r_y0": 104.67700000000002, "r_x1": 457.417, "r_y1": 104.67700000000002, "r_x2": 457.417, "r_y2": 97.62300000000005, "r_x3": 449.896, "r_y3": 97.62300000000005, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 87, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 476.401, "r_y0": 106.74300000000005, "r_x1": 496.326, "r_y1": 106.74300000000005, "r_x2": 496.326, "r_y2": 98.19100000000003, "r_x3": 476.401, "r_y3": 98.19100000000003, "coord_origin": "TOPLEFT"}, "text": "112k", "orig": "112k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 88, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 513.462, "r_y0": 106.74300000000005, "r_x1": 531.733, "r_y1": 106.74300000000005, "r_x2": 531.733, "r_y2": 98.19100000000003, "r_x3": 513.462, "r_y3": 98.19100000000003, "coord_origin": "TOPLEFT"}, "text": "PDF", "orig": "PDF", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 89, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 317.06, "r_y0": 118.69899999999996, "r_x1": 359.979, "r_y1": 118.69899999999996, "r_x2": 359.979, "r_y2": 110.14700000000005, "r_x3": 317.06, "r_y3": 110.14700000000005, "coord_origin": "TOPLEFT"}, "text": "TableBank", "orig": "TableBank", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 90, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 417.856, "r_y0": 116.63300000000004, "r_x1": 425.378, "r_y1": 116.63300000000004, "r_x2": 425.378, "r_y2": 109.57899999999995, "r_x3": 417.856, "r_y3": 109.57899999999995, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 91, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 450.812, "r_y0": 116.63300000000004, "r_x1": 456.501, "r_y1": 116.63300000000004, "r_x2": 456.501, "r_y2": 109.57899999999995, "r_x3": 450.812, "r_y3": 109.57899999999995, "coord_origin": "TOPLEFT"}, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 92, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 476.401, "r_y0": 118.69899999999996, "r_x1": 496.326, "r_y1": 118.69899999999996, "r_x2": 496.326, "r_y2": 110.14700000000005, "r_x3": 476.401, "r_y3": 110.14700000000005, "coord_origin": "TOPLEFT"}, "text": "145k", "orig": "145k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 93, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 511.25, "r_y0": 118.69899999999996, "r_x1": 533.945, "r_y1": 118.69899999999996, "r_x2": 533.945, "r_y2": 110.14700000000005, "r_x3": 511.25, "r_y3": 110.14700000000005, "coord_origin": "TOPLEFT"}, "text": "JPEG", "orig": "JPEG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 94, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 317.06, "r_y0": 130.654, "r_x1": 400.377, "r_y1": 130.654, "r_x2": 400.377, "r_y2": 122.10199999999998, "r_x3": 317.06, "r_y3": 122.10199999999998, "coord_origin": "TOPLEFT"}, "text": "Combined-Tabnet(*)", "orig": "Combined-Tabnet(*)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 95, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 417.856, "r_y0": 128.58799999999997, "r_x1": 425.378, "r_y1": 128.58799999999997, "r_x2": 425.378, "r_y2": 121.53399999999999, "r_x3": 417.856, "r_y3": 121.53399999999999, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 96, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 449.896, "r_y0": 128.58799999999997, "r_x1": 457.417, "r_y1": 128.58799999999997, "r_x2": 457.417, "r_y2": 121.53399999999999, "r_x3": 449.896, "r_y3": 121.53399999999999, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 97, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 476.401, "r_y0": 130.654, "r_x1": 496.326, "r_y1": 130.654, "r_x2": 496.326, "r_y2": 122.10199999999998, "r_x3": 476.401, "r_y3": 122.10199999999998, "coord_origin": "TOPLEFT"}, "text": "400k", "orig": "400k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 98, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 512.635, "r_y0": 130.654, "r_x1": 532.56, "r_y1": 130.654, "r_x2": 532.56, "r_y2": 122.10199999999998, "r_x3": 512.635, "r_y3": 122.10199999999998, "coord_origin": "TOPLEFT"}, "text": "PNG", "orig": "PNG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 99, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 317.06, "r_y0": 142.60900000000004, "r_x1": 375.172, "r_y1": 142.60900000000004, "r_x2": 375.172, "r_y2": 134.05700000000002, "r_x3": 317.06, "r_y3": 134.05700000000002, "coord_origin": "TOPLEFT"}, "text": "Combined(**)", "orig": "Combined(**)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 100, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 417.856, "r_y0": 140.543, "r_x1": 425.378, "r_y1": 140.543, "r_x2": 425.378, "r_y2": 133.48900000000003, "r_x3": 417.856, "r_y3": 133.48900000000003, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 101, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 449.896, "r_y0": 140.543, "r_x1": 457.417, "r_y1": 140.543, "r_x2": 457.417, "r_y2": 133.48900000000003, "r_x3": 449.896, "r_y3": 133.48900000000003, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 102, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 476.401, "r_y0": 142.60900000000004, "r_x1": 496.326, "r_y1": 142.60900000000004, "r_x2": 496.326, "r_y2": 134.05700000000002, "r_x3": 476.401, "r_y3": 134.05700000000002, "coord_origin": "TOPLEFT"}, "text": "500k", "orig": "500k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 103, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 512.635, "r_y0": 142.60900000000004, "r_x1": 532.56, "r_y1": 142.60900000000004, "r_x2": 532.56, "r_y2": 134.05700000000002, "r_x3": 512.635, "r_y3": 134.05700000000002, "coord_origin": "TOPLEFT"}, "text": "PNG", "orig": "PNG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 104, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 317.06, "r_y0": 154.56399999999996, "r_x1": 369.394, "r_y1": 154.56399999999996, "r_x2": 369.394, "r_y2": 146.01199999999994, "r_x3": 317.06, "r_y3": 146.01199999999994, "coord_origin": "TOPLEFT"}, "text": "SynthTabNet", "orig": "SynthTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 105, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 417.856, "r_y0": 152.49800000000005, "r_x1": 425.378, "r_y1": 152.49800000000005, "r_x2": 425.378, "r_y2": 145.44399999999996, "r_x3": 417.856, "r_y3": 145.44399999999996, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 106, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 449.896, "r_y0": 152.49800000000005, "r_x1": 457.417, "r_y1": 152.49800000000005, "r_x2": 457.417, "r_y2": 145.44399999999996, "r_x3": 449.896, "r_y3": 145.44399999999996, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 107, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 476.401, "r_y0": 154.56399999999996, "r_x1": 496.326, "r_y1": 154.56399999999996, "r_x2": 496.326, "r_y2": 146.01199999999994, "r_x3": 476.401, "r_y3": 146.01199999999994, "coord_origin": "TOPLEFT"}, "text": "600k", "orig": "600k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 108, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 512.635, "r_y0": 154.56399999999996, "r_x1": 532.56, "r_y1": 154.56399999999996, "r_x2": 532.56, "r_y2": 146.01199999999994, "r_x3": 512.635, "r_y3": 146.01199999999994, "coord_origin": "TOPLEFT"}, "text": "PNG", "orig": "PNG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": [{"id": 17, "label": "text", "bbox": {"l": 412.332, "t": 73.88300000000004, "r": 430.902, "b": 82.43499999999995, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 75, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 412.332, "r_y0": 82.43499999999995, "r_x1": 430.902, "r_y1": 82.43499999999995, "r_x2": 430.902, "r_y2": 73.88300000000004, "r_x3": 412.332, "r_y3": 73.88300000000004, "coord_origin": "TOPLEFT"}, "text": "Tags", "orig": "Tags", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 18, "label": "text", "bbox": {"l": 442.857, "t": 73.88300000000004, "r": 464.446, "b": 82.43499999999995, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 76, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 442.857, "r_y0": 82.43499999999995, "r_x1": 464.446, "r_y1": 82.43499999999995, "r_x2": 464.446, "r_y2": 73.88300000000004, "r_x3": 442.857, "r_y3": 73.88300000000004, "coord_origin": "TOPLEFT"}, "text": "Bbox", "orig": "Bbox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 19, "label": "text", "bbox": {"l": 477.786, "t": 73.88300000000004, "r": 494.942, "b": 82.43499999999995, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 77, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 477.786, "r_y0": 82.43499999999995, "r_x1": 494.942, "r_y1": 82.43499999999995, "r_x2": 494.942, "r_y2": 73.88300000000004, "r_x3": 477.786, "r_y3": 73.88300000000004, "coord_origin": "TOPLEFT"}, "text": "Size", "orig": "Size", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 20, "label": "text", "bbox": {"l": 508.282, "t": 73.88300000000004, "r": 536.914, "b": 82.43499999999995, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 78, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 508.282, "r_y0": 82.43499999999995, "r_x1": 536.914, "r_y1": 82.43499999999995, "r_x2": 536.914, "r_y2": 73.88300000000004, "r_x3": 508.282, "r_y3": 73.88300000000004, "coord_origin": "TOPLEFT"}, "text": "Format", "orig": "Format", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 21, "label": "text", "bbox": {"l": 317.06, "t": 86.23599999999999, "r": 361.643, "b": 94.78800000000001, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 79, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 317.06, "r_y0": 94.78800000000001, "r_x1": 361.643, "r_y1": 94.78800000000001, "r_x2": 361.643, "r_y2": 86.23599999999999, "r_x3": 317.06, "r_y3": 86.23599999999999, "coord_origin": "TOPLEFT"}, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 22, "label": "text", "bbox": {"l": 417.856, "t": 85.668, "r": 425.378, "b": 92.72199999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 80, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 417.856, "r_y0": 92.72199999999998, "r_x1": 425.378, "r_y1": 92.72199999999998, "r_x2": 425.378, "r_y2": 85.668, "r_x3": 417.856, "r_y3": 85.668, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 23, "label": "text", "bbox": {"l": 449.896, "t": 85.668, "r": 457.417, "b": 92.72199999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 81, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 449.896, "r_y0": 92.72199999999998, "r_x1": 457.417, "r_y1": 92.72199999999998, "r_x2": 457.417, "r_y2": 85.668, "r_x3": 449.896, "r_y3": 85.668, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 24, "label": "text", "bbox": {"l": 476.401, "t": 86.23599999999999, "r": 496.326, "b": 94.78800000000001, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 82, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 476.401, "r_y0": 94.78800000000001, "r_x1": 496.326, "r_y1": 94.78800000000001, "r_x2": 496.326, "r_y2": 86.23599999999999, "r_x3": 476.401, "r_y3": 86.23599999999999, "coord_origin": "TOPLEFT"}, "text": "509k", "orig": "509k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 25, "label": "text", "bbox": {"l": 512.635, "t": 86.23599999999999, "r": 532.56, "b": 94.78800000000001, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 83, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 512.635, "r_y0": 94.78800000000001, "r_x1": 532.56, "r_y1": 94.78800000000001, "r_x2": 532.56, "r_y2": 86.23599999999999, "r_x3": 512.635, "r_y3": 86.23599999999999, "coord_origin": "TOPLEFT"}, "text": "PNG", "orig": "PNG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 26, "label": "text", "bbox": {"l": 317.06, "t": 98.19100000000003, "r": 359.431, "b": 106.74300000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 84, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 317.06, "r_y0": 106.74300000000005, "r_x1": 359.431, "r_y1": 106.74300000000005, "r_x2": 359.431, "r_y2": 98.19100000000003, "r_x3": 317.06, "r_y3": 98.19100000000003, "coord_origin": "TOPLEFT"}, "text": "FinTabNet", "orig": "FinTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 27, "label": "text", "bbox": {"l": 417.856, "t": 97.62300000000005, "r": 425.378, "b": 104.67700000000002, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 85, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 417.856, "r_y0": 104.67700000000002, "r_x1": 425.378, "r_y1": 104.67700000000002, "r_x2": 425.378, "r_y2": 97.62300000000005, "r_x3": 417.856, "r_y3": 97.62300000000005, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 28, "label": "text", "bbox": {"l": 449.896, "t": 97.62300000000005, "r": 457.417, "b": 104.67700000000002, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 86, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 449.896, "r_y0": 104.67700000000002, "r_x1": 457.417, "r_y1": 104.67700000000002, "r_x2": 457.417, "r_y2": 97.62300000000005, "r_x3": 449.896, "r_y3": 97.62300000000005, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 29, "label": "text", "bbox": {"l": 476.401, "t": 98.19100000000003, "r": 496.326, "b": 106.74300000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 87, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 476.401, "r_y0": 106.74300000000005, "r_x1": 496.326, "r_y1": 106.74300000000005, "r_x2": 496.326, "r_y2": 98.19100000000003, "r_x3": 476.401, "r_y3": 98.19100000000003, "coord_origin": "TOPLEFT"}, "text": "112k", "orig": "112k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 30, "label": "text", "bbox": {"l": 513.462, "t": 98.19100000000003, "r": 531.733, "b": 106.74300000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 88, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 513.462, "r_y0": 106.74300000000005, "r_x1": 531.733, "r_y1": 106.74300000000005, "r_x2": 531.733, "r_y2": 98.19100000000003, "r_x3": 513.462, "r_y3": 98.19100000000003, "coord_origin": "TOPLEFT"}, "text": "PDF", "orig": "PDF", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 31, "label": "text", "bbox": {"l": 317.06, "t": 110.14700000000005, "r": 359.979, "b": 118.69899999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 89, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 317.06, "r_y0": 118.69899999999996, "r_x1": 359.979, "r_y1": 118.69899999999996, "r_x2": 359.979, "r_y2": 110.14700000000005, "r_x3": 317.06, "r_y3": 110.14700000000005, "coord_origin": "TOPLEFT"}, "text": "TableBank", "orig": "TableBank", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 32, "label": "text", "bbox": {"l": 417.856, "t": 109.57899999999995, "r": 425.378, "b": 116.63300000000004, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 90, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 417.856, "r_y0": 116.63300000000004, "r_x1": 425.378, "r_y1": 116.63300000000004, "r_x2": 425.378, "r_y2": 109.57899999999995, "r_x3": 417.856, "r_y3": 109.57899999999995, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 33, "label": "text", "bbox": {"l": 450.812, "t": 109.57899999999995, "r": 456.501, "b": 116.63300000000004, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 91, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 450.812, "r_y0": 116.63300000000004, "r_x1": 456.501, "r_y1": 116.63300000000004, "r_x2": 456.501, "r_y2": 109.57899999999995, "r_x3": 450.812, "r_y3": 109.57899999999995, "coord_origin": "TOPLEFT"}, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 34, "label": "text", "bbox": {"l": 476.401, "t": 110.14700000000005, "r": 496.326, "b": 118.69899999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 92, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 476.401, "r_y0": 118.69899999999996, "r_x1": 496.326, "r_y1": 118.69899999999996, "r_x2": 496.326, "r_y2": 110.14700000000005, "r_x3": 476.401, "r_y3": 110.14700000000005, "coord_origin": "TOPLEFT"}, "text": "145k", "orig": "145k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 35, "label": "text", "bbox": {"l": 511.25, "t": 110.14700000000005, "r": 533.945, "b": 118.69899999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 93, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 511.25, "r_y0": 118.69899999999996, "r_x1": 533.945, "r_y1": 118.69899999999996, "r_x2": 533.945, "r_y2": 110.14700000000005, "r_x3": 511.25, "r_y3": 110.14700000000005, "coord_origin": "TOPLEFT"}, "text": "JPEG", "orig": "JPEG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 36, "label": "text", "bbox": {"l": 317.06, "t": 122.10199999999998, "r": 400.377, "b": 130.654, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 94, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 317.06, "r_y0": 130.654, "r_x1": 400.377, "r_y1": 130.654, "r_x2": 400.377, "r_y2": 122.10199999999998, "r_x3": 317.06, "r_y3": 122.10199999999998, "coord_origin": "TOPLEFT"}, "text": "Combined-Tabnet(*)", "orig": "Combined-Tabnet(*)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 37, "label": "text", "bbox": {"l": 417.856, "t": 121.53399999999999, "r": 425.378, "b": 128.58799999999997, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 95, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 417.856, "r_y0": 128.58799999999997, "r_x1": 425.378, "r_y1": 128.58799999999997, "r_x2": 425.378, "r_y2": 121.53399999999999, "r_x3": 417.856, "r_y3": 121.53399999999999, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 38, "label": "text", "bbox": {"l": 449.896, "t": 121.53399999999999, "r": 457.417, "b": 128.58799999999997, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 96, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 449.896, "r_y0": 128.58799999999997, "r_x1": 457.417, "r_y1": 128.58799999999997, "r_x2": 457.417, "r_y2": 121.53399999999999, "r_x3": 449.896, "r_y3": 121.53399999999999, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 39, "label": "text", "bbox": {"l": 476.401, "t": 122.10199999999998, "r": 496.326, "b": 130.654, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 97, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 476.401, "r_y0": 130.654, "r_x1": 496.326, "r_y1": 130.654, "r_x2": 496.326, "r_y2": 122.10199999999998, "r_x3": 476.401, "r_y3": 122.10199999999998, "coord_origin": "TOPLEFT"}, "text": "400k", "orig": "400k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 40, "label": "text", "bbox": {"l": 512.635, "t": 122.10199999999998, "r": 532.56, "b": 130.654, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 98, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 512.635, "r_y0": 130.654, "r_x1": 532.56, "r_y1": 130.654, "r_x2": 532.56, "r_y2": 122.10199999999998, "r_x3": 512.635, "r_y3": 122.10199999999998, "coord_origin": "TOPLEFT"}, "text": "PNG", "orig": "PNG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 41, "label": "text", "bbox": {"l": 317.06, "t": 134.05700000000002, "r": 375.172, "b": 142.60900000000004, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 99, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 317.06, "r_y0": 142.60900000000004, "r_x1": 375.172, "r_y1": 142.60900000000004, "r_x2": 375.172, "r_y2": 134.05700000000002, "r_x3": 317.06, "r_y3": 134.05700000000002, "coord_origin": "TOPLEFT"}, "text": "Combined(**)", "orig": "Combined(**)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 42, "label": "text", "bbox": {"l": 417.856, "t": 133.48900000000003, "r": 425.378, "b": 140.543, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 100, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 417.856, "r_y0": 140.543, "r_x1": 425.378, "r_y1": 140.543, "r_x2": 425.378, "r_y2": 133.48900000000003, "r_x3": 417.856, "r_y3": 133.48900000000003, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 43, "label": "text", "bbox": {"l": 449.896, "t": 133.48900000000003, "r": 457.417, "b": 140.543, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 101, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 449.896, "r_y0": 140.543, "r_x1": 457.417, "r_y1": 140.543, "r_x2": 457.417, "r_y2": 133.48900000000003, "r_x3": 449.896, "r_y3": 133.48900000000003, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 44, "label": "text", "bbox": {"l": 476.401, "t": 134.05700000000002, "r": 496.326, "b": 142.60900000000004, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 102, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 476.401, "r_y0": 142.60900000000004, "r_x1": 496.326, "r_y1": 142.60900000000004, "r_x2": 496.326, "r_y2": 134.05700000000002, "r_x3": 476.401, "r_y3": 134.05700000000002, "coord_origin": "TOPLEFT"}, "text": "500k", "orig": "500k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 45, "label": "text", "bbox": {"l": 512.635, "t": 134.05700000000002, "r": 532.56, "b": 142.60900000000004, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 103, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 512.635, "r_y0": 142.60900000000004, "r_x1": 532.56, "r_y1": 142.60900000000004, "r_x2": 532.56, "r_y2": 134.05700000000002, "r_x3": 512.635, "r_y3": 134.05700000000002, "coord_origin": "TOPLEFT"}, "text": "PNG", "orig": "PNG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 46, "label": "text", "bbox": {"l": 317.06, "t": 146.01199999999994, "r": 369.394, "b": 154.56399999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 104, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 317.06, "r_y0": 154.56399999999996, "r_x1": 369.394, "r_y1": 154.56399999999996, "r_x2": 369.394, "r_y2": 146.01199999999994, "r_x3": 317.06, "r_y3": 146.01199999999994, "coord_origin": "TOPLEFT"}, "text": "SynthTabNet", "orig": "SynthTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 47, "label": "text", "bbox": {"l": 417.856, "t": 145.44399999999996, "r": 425.378, "b": 152.49800000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 105, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 417.856, "r_y0": 152.49800000000005, "r_x1": 425.378, "r_y1": 152.49800000000005, "r_x2": 425.378, "r_y2": 145.44399999999996, "r_x3": 417.856, "r_y3": 145.44399999999996, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 48, "label": "text", "bbox": {"l": 449.896, "t": 145.44399999999996, "r": 457.417, "b": 152.49800000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 106, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 449.896, "r_y0": 152.49800000000005, "r_x1": 457.417, "r_y1": 152.49800000000005, "r_x2": 457.417, "r_y2": 145.44399999999996, "r_x3": 449.896, "r_y3": 145.44399999999996, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 49, "label": "text", "bbox": {"l": 476.401, "t": 146.01199999999994, "r": 496.326, "b": 154.56399999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 107, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 476.401, "r_y0": 154.56399999999996, "r_x1": 496.326, "r_y1": 154.56399999999996, "r_x2": 496.326, "r_y2": 146.01199999999994, "r_x3": 476.401, "r_y3": 146.01199999999994, "coord_origin": "TOPLEFT"}, "text": "600k", "orig": "600k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 50, "label": "text", "bbox": {"l": 512.635, "t": 146.01199999999994, "r": 532.56, "b": 154.56399999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 108, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 512.635, "r_y0": 154.56399999999996, "r_x1": 532.56, "r_y1": 154.56399999999996, "r_x2": 532.56, "r_y2": 146.01199999999994, "r_x3": 512.635, "r_y3": 146.01199999999994, "coord_origin": "TOPLEFT"}, "text": "PNG", "orig": "PNG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}]}, {"id": 9, "label": "caption", "bbox": {"l": 308.862, "t": 167.75099999999998, "r": 545.115, "b": 224.303, "coord_origin": "TOPLEFT"}, "confidence": 0.9667726755142212, "cells": [{"index": 109, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 176.48199999999997, "r_x1": 330.75, "r_y1": 176.48199999999997, "r_x2": 330.75, "r_y2": 167.92999999999995, "r_x3": 308.862, "r_y3": 167.92999999999995, "coord_origin": "TOPLEFT"}, "text": "Table", "orig": "Table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 110, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 336.867, "r_y0": 176.48199999999997, "r_x1": 344.618, "r_y1": 176.48199999999997, "r_x2": 344.618, "r_y2": 167.92999999999995, "r_x3": 336.867, "r_y3": 167.92999999999995, "coord_origin": "TOPLEFT"}, "text": "1:", "orig": "1:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 111, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 361.076, "r_y0": 176.48199999999997, "r_x1": 380.453, "r_y1": 176.48199999999997, "r_x2": 380.453, "r_y2": 167.92999999999995, "r_x3": 361.076, "r_y3": 167.92999999999995, "coord_origin": "TOPLEFT"}, "text": "Both", "orig": "Both", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 112, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 386.568, "r_y0": 176.33900000000006, "r_x1": 468.68, "r_y1": 176.33900000000006, "r_x2": 468.68, "r_y2": 167.75099999999998, "r_x3": 386.568, "r_y3": 167.75099999999998, "coord_origin": "TOPLEFT"}, "text": "'Combined-Tabnet'", "orig": "'Combined-Tabnet'", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 113, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 474.796, "r_y0": 176.48199999999997, "r_x1": 489.182, "r_y1": 176.48199999999997, "r_x2": 489.182, "r_y2": 167.92999999999995, "r_x3": 474.796, "r_y3": 167.92999999999995, "coord_origin": "TOPLEFT"}, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 114, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 495.299, "r_y0": 176.33900000000006, "r_x1": 545.112, "r_y1": 176.33900000000006, "r_x2": 545.112, "r_y2": 167.75099999999998, "r_x3": 495.299, "r_y3": 167.75099999999998, "coord_origin": "TOPLEFT"}, "text": "'Combined-", "orig": "'Combined-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 115, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 188.29399999999998, "r_x1": 341.161, "r_y1": 188.29399999999998, "r_x2": 341.161, "r_y2": 179.70600000000002, "r_x3": 308.862, "r_y3": 179.70600000000002, "coord_origin": "TOPLEFT"}, "text": "Tabnet'", "orig": "Tabnet'", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 116, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 343.457, "r_y0": 188.437, "r_x1": 545.11, "r_y1": 188.437, "r_x2": 545.11, "r_y2": 179.885, "r_x3": 343.457, "r_y3": 179.885, "coord_origin": "TOPLEFT"}, "text": "are variations of the following: (*) The Combined-", "orig": "are variations of the following: (*) The Combined-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 117, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 200.39200000000005, "r_x1": 545.115, "r_y1": 200.39200000000005, "r_x2": 545.115, "r_y2": 191.84000000000003, "r_x3": 308.862, "r_y3": 191.84000000000003, "coord_origin": "TOPLEFT"}, "text": "Tabnet dataset is the processed combination of PubTabNet", "orig": "Tabnet dataset is the processed combination of PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 118, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 212.34699999999998, "r_x1": 366.276, "r_y1": 212.34699999999998, "r_x2": 366.276, "r_y2": 203.79499999999996, "r_x3": 308.862, "r_y3": 203.79499999999996, "coord_origin": "TOPLEFT"}, "text": "and Fintabnet.", "orig": "and Fintabnet.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 119, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 370.58, "r_y0": 212.34699999999998, "r_x1": 545.115, "r_y1": 212.34699999999998, "r_x2": 545.115, "r_y2": 203.79499999999996, "r_x3": 370.58, "r_y3": 203.79499999999996, "coord_origin": "TOPLEFT"}, "text": "(**) The combined dataset is the processed", "orig": "(**) The combined dataset is the processed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 120, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 224.303, "r_x1": 523.935, "r_y1": 224.303, "r_x2": 523.935, "r_y2": 215.75099999999998, "r_x3": 308.862, "r_y3": 215.75099999999998, "coord_origin": "TOPLEFT"}, "text": "combination of PubTabNet, Fintabnet and TableBank.", "orig": "combination of PubTabNet, Fintabnet and TableBank.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 6, "label": "text", "bbox": {"l": 308.862, "t": 249.889, "r": 545.115, "b": 294.306, "coord_origin": "TOPLEFT"}, "confidence": 0.978954017162323, "cells": [{"index": 121, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 258.44100000000003, "r_x1": 545.115, "r_y1": 258.44100000000003, "r_x2": 545.115, "r_y2": 249.889, "r_x3": 308.862, "r_y3": 249.889, "coord_origin": "TOPLEFT"}, "text": "one adopts a colorful appearance with high contrast and the", "orig": "one adopts a colorful appearance with high contrast and the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 122, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 270.39599999999996, "r_x1": 545.115, "r_y1": 270.39599999999996, "r_x2": 545.115, "r_y2": 261.84400000000005, "r_x3": 308.862, "r_y3": 261.84400000000005, "coord_origin": "TOPLEFT"}, "text": "last one contains tables with sparse content. Lastly, we have", "orig": "last one contains tables with sparse content. Lastly, we have", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 123, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 282.351, "r_x1": 545.115, "r_y1": 282.351, "r_x2": 545.115, "r_y2": 273.799, "r_x3": 308.862, "r_y3": 273.799, "coord_origin": "TOPLEFT"}, "text": "combined all synthetic datasets into one big unified syn-", "orig": "combined all synthetic datasets into one big unified syn-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 124, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 294.306, "r_x1": 436.822, "r_y1": 294.306, "r_x2": 436.822, "r_y2": 285.754, "r_x3": 308.862, "r_y3": 285.754, "coord_origin": "TOPLEFT"}, "text": "thetic dataset of 600k examples.", "orig": "thetic dataset of 600k examples.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 13, "label": "text", "bbox": {"l": 320.817, "t": 298.041, "r": 542.744, "b": 306.593, "coord_origin": "TOPLEFT"}, "confidence": 0.9043695330619812, "cells": [{"index": 125, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 306.593, "r_x1": 542.744, "r_y1": 306.593, "r_x2": 542.744, "r_y2": 298.041, "r_x3": 320.817, "r_y3": 298.041, "coord_origin": "TOPLEFT"}, "text": "Tab. 1 summarizes the various attributes of the datasets.", "orig": "Tab. 1 summarizes the various attributes of the datasets.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 11, "label": "section_header", "bbox": {"l": 308.862, "t": 321.184, "r": 444.936, "b": 331.932, "coord_origin": "TOPLEFT"}, "confidence": 0.9466595649719238, "cells": [{"index": 126, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 331.932, "r_x1": 444.936, "r_y1": 331.932, "r_x2": 444.936, "r_y2": 321.184, "r_x3": 308.862, "r_y3": 321.184, "coord_origin": "TOPLEFT"}, "text": "4. The TableFormer model", "orig": "4. The TableFormer model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 0, "label": "text", "bbox": {"l": 308.862, "t": 342.208, "r": 545.115, "b": 446.401, "coord_origin": "TOPLEFT"}, "confidence": 0.9884450435638428, "cells": [{"index": 127, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 350.76, "r_x1": 545.115, "r_y1": 350.76, "r_x2": 545.115, "r_y2": 342.208, "r_x3": 320.817, "r_y3": 342.208, "coord_origin": "TOPLEFT"}, "text": "Given the image of a table, TableFormer is able to pre-", "orig": "Given the image of a table, TableFormer is able to pre-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 128, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 362.715, "r_x1": 326.576, "r_y1": 362.715, "r_x2": 326.576, "r_y2": 354.163, "r_x3": 308.862, "r_y3": 354.163, "coord_origin": "TOPLEFT"}, "text": "dict:", "orig": "dict:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 129, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 330.172, "r_y0": 362.715, "r_x1": 545.115, "r_y1": 362.715, "r_x2": 545.115, "r_y2": 354.163, "r_x3": 330.172, "r_y3": 354.163, "coord_origin": "TOPLEFT"}, "text": "1) a sequence of tokens that represent the structure of", "orig": "1) a sequence of tokens that represent the structure of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 130, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 374.67, "r_x1": 545.115, "r_y1": 374.67, "r_x2": 545.115, "r_y2": 366.118, "r_x3": 308.862, "r_y3": 366.118, "coord_origin": "TOPLEFT"}, "text": "a table, and 2) a bounding box coupled to a subset of those", "orig": "a table, and 2) a bounding box coupled to a subset of those", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 131, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 386.625, "r_x1": 337.265, "r_y1": 386.625, "r_x2": 337.265, "r_y2": 378.073, "r_x3": 308.862, "r_y3": 378.073, "coord_origin": "TOPLEFT"}, "text": "tokens.", "orig": "tokens.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 132, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 341.808, "r_y0": 386.625, "r_x1": 545.115, "r_y1": 386.625, "r_x2": 545.115, "r_y2": 378.073, "r_x3": 341.808, "r_y3": 378.073, "coord_origin": "TOPLEFT"}, "text": "The conversion of an image into a sequence of to-", "orig": "The conversion of an image into a sequence of to-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 133, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 398.58, "r_x1": 545.115, "r_y1": 398.58, "r_x2": 545.115, "r_y2": 390.028, "r_x3": 308.862, "r_y3": 390.028, "coord_origin": "TOPLEFT"}, "text": "kens is a well-known task [35, 16]. While attention is often", "orig": "kens is a well-known task [35, 16]. While attention is often", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 134, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 410.535, "r_x1": 545.115, "r_y1": 410.535, "r_x2": 545.115, "r_y2": 401.983, "r_x3": 308.862, "r_y3": 401.983, "coord_origin": "TOPLEFT"}, "text": "used as an implicit method to associate each token of the", "orig": "used as an implicit method to associate each token of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 135, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 422.491, "r_x1": 545.115, "r_y1": 422.491, "r_x2": 545.115, "r_y2": 413.939, "r_x3": 308.862, "r_y3": 413.939, "coord_origin": "TOPLEFT"}, "text": "sequence with a position in the original image, an explicit", "orig": "sequence with a position in the original image, an explicit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 136, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 434.446, "r_x1": 545.115, "r_y1": 434.446, "r_x2": 545.115, "r_y2": 425.894, "r_x3": 308.862, "r_y3": 425.894, "coord_origin": "TOPLEFT"}, "text": "association between the individual table-cells and the image", "orig": "association between the individual table-cells and the image", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 137, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 446.401, "r_x1": 437.937, "r_y1": 446.401, "r_x2": 437.937, "r_y2": 437.849, "r_x3": 308.862, "r_y3": 437.849, "coord_origin": "TOPLEFT"}, "text": "bounding boxes is also required.", "orig": "bounding boxes is also required.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 12, "label": "section_header", "bbox": {"l": 308.862, "t": 457.694, "r": 420.161, "b": 467.546, "coord_origin": "TOPLEFT"}, "confidence": 0.937696099281311, "cells": [{"index": 138, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 467.546, "r_x1": 420.161, "r_y1": 467.546, "r_x2": 420.161, "r_y2": 457.694, "r_x3": 308.862, "r_y3": 457.694, "coord_origin": "TOPLEFT"}, "text": "4.1. Model architecture.", "orig": "4.1. Model architecture.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 2, "label": "text", "bbox": {"l": 308.862, "t": 477.034, "r": 545.116, "b": 664.914, "coord_origin": "TOPLEFT"}, "confidence": 0.9878323078155518, "cells": [{"index": 139, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 485.586, "r_x1": 545.115, "r_y1": 485.586, "r_x2": 545.115, "r_y2": 477.034, "r_x3": 320.817, "r_y3": 477.034, "coord_origin": "TOPLEFT"}, "text": "We now describe in detail the proposed method, which", "orig": "We now describe in detail the proposed method, which", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 140, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 497.541, "r_x1": 315.507, "r_y1": 497.541, "r_x2": 315.507, "r_y2": 488.989, "r_x3": 308.862, "r_y3": 488.989, "coord_origin": "TOPLEFT"}, "text": "is", "orig": "is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 141, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 319.153, "r_y0": 497.541, "r_x1": 509.021, "r_y1": 497.541, "r_x2": 509.021, "r_y2": 488.989, "r_x3": 319.153, "r_y3": 488.989, "coord_origin": "TOPLEFT"}, "text": "composed of three main components, see Fig.", "orig": "composed of three main components, see Fig.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 142, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 515.586, "r_y0": 497.541, "r_x1": 523.058, "r_y1": 497.541, "r_x2": 523.058, "r_y2": 488.989, "r_x3": 515.586, "r_y3": 488.989, "coord_origin": "TOPLEFT"}, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 143, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 529.623, "r_y0": 497.541, "r_x1": 545.115, "r_y1": 497.541, "r_x2": 545.115, "r_y2": 488.989, "r_x3": 529.623, "r_y3": 488.989, "coord_origin": "TOPLEFT"}, "text": "Our", "orig": "Our", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 144, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 509.353, "r_x1": 406.346, "r_y1": 509.353, "r_x2": 406.346, "r_y2": 500.765, "r_x3": 308.862, "r_y3": 500.765, "coord_origin": "TOPLEFT"}, "text": "CNN Backbone Network", "orig": "CNN Backbone Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 145, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 408.872, "r_y0": 509.496, "r_x1": 545.111, "r_y1": 509.496, "r_x2": 545.111, "r_y2": 500.944, "r_x3": 408.872, "r_y3": 500.944, "coord_origin": "TOPLEFT"}, "text": "encodes the input as a feature vec-", "orig": "encodes the input as a feature vec-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 146, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 521.452, "r_x1": 319.93, "r_y1": 521.452, "r_x2": 319.93, "r_y2": 512.9, "r_x3": 308.862, "r_y3": 512.9, "coord_origin": "TOPLEFT"}, "text": "tor", "orig": "tor", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 147, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 323.836, "r_y0": 521.452, "r_x1": 409.395, "r_y1": 521.452, "r_x2": 409.395, "r_y2": 512.9, "r_x3": 323.836, "r_y3": 512.9, "coord_origin": "TOPLEFT"}, "text": "of predefined length.", "orig": "of predefined length.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 148, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 416.727, "r_y0": 521.452, "r_x1": 545.115, "r_y1": 521.452, "r_x2": 545.115, "r_y2": 512.9, "r_x3": 416.727, "r_y3": 512.9, "coord_origin": "TOPLEFT"}, "text": "The input feature vector of the", "orig": "The input feature vector of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 149, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 533.4069999999999, "r_x1": 436.194, "r_y1": 533.4069999999999, "r_x2": 436.194, "r_y2": 524.855, "r_x3": 308.862, "r_y3": 524.855, "coord_origin": "TOPLEFT"}, "text": "encoded image is passed to the", "orig": "encoded image is passed to the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 150, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 439.526, "r_y0": 533.264, "r_x1": 513.867, "r_y1": 533.264, "r_x2": 513.867, "r_y2": 524.6759999999999, "r_x3": 439.526, "r_y3": 524.6759999999999, "coord_origin": "TOPLEFT"}, "text": "Structure Decoder", "orig": "Structure Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 151, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 517.432, "r_y0": 533.4069999999999, "r_x1": 545.108, "r_y1": 533.4069999999999, "r_x2": 545.108, "r_y2": 524.855, "r_x3": 517.432, "r_y3": 524.855, "coord_origin": "TOPLEFT"}, "text": "to pro-", "orig": "to pro-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 152, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 545.362, "r_x1": 545.115, "r_y1": 545.362, "r_x2": 545.115, "r_y2": 536.81, "r_x3": 308.862, "r_y3": 536.81, "coord_origin": "TOPLEFT"}, "text": "duce a sequence of HTML tags that represent the structure", "orig": "duce a sequence of HTML tags that represent the structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 153, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 557.317, "r_x1": 358.545, "r_y1": 557.317, "r_x2": 358.545, "r_y2": 548.765, "r_x3": 308.862, "r_y3": 548.765, "coord_origin": "TOPLEFT"}, "text": "of the table.", "orig": "of the table.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 154, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 365.191, "r_y0": 557.317, "r_x1": 545.115, "r_y1": 557.317, "r_x2": 545.115, "r_y2": 548.765, "r_x3": 365.191, "r_y3": 548.765, "coord_origin": "TOPLEFT"}, "text": "With each prediction of an HTML standard", "orig": "With each prediction of an HTML standard", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 155, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 569.2719999999999, "r_x1": 352.409, "r_y1": 569.2719999999999, "r_x2": 352.409, "r_y2": 560.72, "r_x3": 308.862, "r_y3": 560.72, "coord_origin": "TOPLEFT"}, "text": "data cell ('", "orig": "data cell ('", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 156, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 352.409, "r_y0": 569.108, "r_x1": 360.158, "r_y1": 569.108, "r_x2": 360.158, "r_y2": 560.402, "r_x3": 352.409, "r_y3": 560.402, "coord_origin": "TOPLEFT"}, "text": "<", "orig": "<", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 157, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 360.158, "r_y0": 569.2719999999999, "r_x1": 367.909, "r_y1": 569.2719999999999, "r_x2": 367.909, "r_y2": 560.72, "r_x3": 360.158, "r_y3": 560.72, "coord_origin": "TOPLEFT"}, "text": "td", "orig": "td", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 158, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 367.909, "r_y0": 569.108, "r_x1": 375.658, "r_y1": 569.108, "r_x2": 375.658, "r_y2": 560.402, "r_x3": 367.909, "r_y3": 560.402, "coord_origin": "TOPLEFT"}, "text": ">", "orig": ">", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 159, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 375.658, "r_y0": 569.2719999999999, "r_x1": 545.112, "r_y1": 569.2719999999999, "r_x2": 545.112, "r_y2": 560.72, "r_x3": 375.658, "r_y3": 560.72, "coord_origin": "TOPLEFT"}, "text": "') the hidden state of that cell is passed to", "orig": "') the hidden state of that cell is passed to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 160, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 581.2280000000001, "r_x1": 545.115, "r_y1": 581.2280000000001, "r_x2": 545.115, "r_y2": 572.6759999999999, "r_x3": 308.862, "r_y3": 572.6759999999999, "coord_origin": "TOPLEFT"}, "text": "the Cell BBox Decoder. As for spanning cells, such as row", "orig": "the Cell BBox Decoder. As for spanning cells, such as row", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 161, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 593.183, "r_x1": 483.118, "r_y1": 593.183, "r_x2": 483.118, "r_y2": 584.631, "r_x3": 308.862, "r_y3": 584.631, "coord_origin": "TOPLEFT"}, "text": "or column span, the tag is broken down to '", "orig": "or column span, the tag is broken down to '", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 162, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 483.119, "r_y0": 593.019, "r_x1": 490.868, "r_y1": 593.019, "r_x2": 490.868, "r_y2": 584.313, "r_x3": 483.119, "r_y3": 584.313, "coord_origin": "TOPLEFT"}, "text": "<", "orig": "<", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 163, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 490.868, "r_y0": 593.183, "r_x1": 545.114, "r_y1": 593.183, "r_x2": 545.114, "r_y2": 584.631, "r_x3": 490.868, "r_y3": 584.631, "coord_origin": "TOPLEFT"}, "text": "', 'rowspan='", "orig": "', 'rowspan='", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 164, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 605.138, "r_x1": 545.115, "r_y1": 605.138, "r_x2": 545.115, "r_y2": 596.586, "r_x3": 308.862, "r_y3": 596.586, "coord_origin": "TOPLEFT"}, "text": "or 'colspan=', with the number of spanning cells (attribute),", "orig": "or 'colspan=', with the number of spanning cells (attribute),", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 165, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 617.093, "r_x1": 329.644, "r_y1": 617.093, "r_x2": 329.644, "r_y2": 608.5409999999999, "r_x3": 308.862, "r_y3": 608.5409999999999, "coord_origin": "TOPLEFT"}, "text": "and '", "orig": "and '", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 166, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 329.646, "r_y0": 616.929, "r_x1": 337.395, "r_y1": 616.929, "r_x2": 337.395, "r_y2": 608.223, "r_x3": 329.646, "r_y3": 608.223, "coord_origin": "TOPLEFT"}, "text": ">", "orig": ">", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 167, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 337.394, "r_y0": 617.093, "r_x1": 343.202, "r_y1": 617.093, "r_x2": 343.202, "r_y2": 608.5409999999999, "r_x3": 337.394, "r_y3": 608.5409999999999, "coord_origin": "TOPLEFT"}, "text": "'.", "orig": "'.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 168, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 348.064, "r_y0": 617.093, "r_x1": 468.591, "r_y1": 617.093, "r_x2": 468.591, "r_y2": 608.5409999999999, "r_x3": 348.064, "r_y3": 608.5409999999999, "coord_origin": "TOPLEFT"}, "text": "The hidden state attached to '", "orig": "The hidden state attached to '", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 169, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 468.595, "r_y0": 616.929, "r_x1": 476.344, "r_y1": 616.929, "r_x2": 476.344, "r_y2": 608.223, "r_x3": 468.595, "r_y3": 608.223, "coord_origin": "TOPLEFT"}, "text": "<", "orig": "<", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 170, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 476.344, "r_y0": 617.093, "r_x1": 545.116, "r_y1": 617.093, "r_x2": 545.116, "r_y2": 608.5409999999999, "r_x3": 476.344, "r_y3": 608.5409999999999, "coord_origin": "TOPLEFT"}, "text": "' is passed to the", "orig": "' is passed to the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 171, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 629.048, "r_x1": 545.115, "r_y1": 629.048, "r_x2": 545.115, "r_y2": 620.496, "r_x3": 308.862, "r_y3": 620.496, "coord_origin": "TOPLEFT"}, "text": "Cell BBox Decoder. A shared feed forward network (FFN)", "orig": "Cell BBox Decoder. A shared feed forward network (FFN)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 172, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 641.0029999999999, "r_x1": 533.2, "r_y1": 641.0029999999999, "r_x2": 533.2, "r_y2": 632.451, "r_x3": 308.862, "r_y3": 632.451, "coord_origin": "TOPLEFT"}, "text": "receives the hidden states from the Structure Decoder,", "orig": "receives the hidden states from the Structure Decoder,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 173, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 537.364, "r_y0": 641.0029999999999, "r_x1": 545.115, "r_y1": 641.0029999999999, "r_x2": 545.115, "r_y2": 632.451, "r_x3": 537.364, "r_y3": 632.451, "coord_origin": "TOPLEFT"}, "text": "to", "orig": "to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 174, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 652.9590000000001, "r_x1": 545.115, "r_y1": 652.9590000000001, "r_x2": 545.115, "r_y2": 644.407, "r_x3": 308.862, "r_y3": 644.407, "coord_origin": "TOPLEFT"}, "text": "provide the final detection predictions of the bounding box", "orig": "provide the final detection predictions of the bounding box", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 175, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 664.914, "r_x1": 449.424, "r_y1": 664.914, "r_x2": 449.424, "r_y2": 656.362, "r_x3": 308.862, "r_y3": 656.362, "coord_origin": "TOPLEFT"}, "text": "coordinates and their classification.", "orig": "coordinates and their classification.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 7, "label": "text", "bbox": {"l": 308.862, "t": 668.261, "r": 545.115, "b": 713.066, "coord_origin": "TOPLEFT"}, "confidence": 0.978580117225647, "cells": [{"index": 176, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 677.217, "r_x1": 431.91, "r_y1": 677.217, "r_x2": 431.91, "r_y2": 668.261, "r_x3": 320.817, "r_y3": 668.261, "coord_origin": "TOPLEFT"}, "text": "CNN Backbone Network.", "orig": "CNN Backbone Network.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 177, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 439.499, "r_y0": 677.201, "r_x1": 545.113, "r_y1": 677.201, "r_x2": 545.113, "r_y2": 668.649, "r_x3": 439.499, "r_y3": 668.649, "coord_origin": "TOPLEFT"}, "text": "A ResNet-18 CNN is the", "orig": "A ResNet-18 CNN is the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 178, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 689.156, "r_x1": 545.115, "r_y1": 689.156, "r_x2": 545.115, "r_y2": 680.604, "r_x3": 308.862, "r_y3": 680.604, "coord_origin": "TOPLEFT"}, "text": "backbone that receives the table image and encodes it as a", "orig": "backbone that receives the table image and encodes it as a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 179, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 701.111, "r_x1": 545.115, "r_y1": 701.111, "r_x2": 545.115, "r_y2": 692.559, "r_x3": 308.862, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "vector of predefined length. The network has been modified", "orig": "vector of predefined length. The network has been modified", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 180, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 713.066, "r_x1": 545.115, "r_y1": 713.066, "r_x2": 545.115, "r_y2": 704.514, "r_x3": 308.862, "r_y3": 704.514, "coord_origin": "TOPLEFT"}, "text": "by removing the linear and pooling layer, as we are not per-", "orig": "by removing the linear and pooling layer, as we are not per-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 14, "label": "page_footer", "bbox": {"l": 295.121, "t": 734.402, "r": 300.102, "b": 742.954, "coord_origin": "TOPLEFT"}, "confidence": 0.8565718531608582, "cells": [{"index": 181, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 295.121, "r_y0": 742.954, "r_x1": 300.102, "r_y1": 742.954, "r_x2": 300.102, "r_y2": 734.402, "r_x3": 295.121, "r_y3": 734.402, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}]}, "tablestructure": {"table_map": {"8": {"label": "table", "id": 8, "page_no": 3, "cluster": {"id": 8, "label": "table", "bbox": {"l": 310.67584228515625, "t": 73.19388580322266, "r": 542.9547119140625, "b": 155.22052001953125, "coord_origin": "TOPLEFT"}, "confidence": 0.9777463674545288, "cells": [{"index": 75, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 412.332, "r_y0": 82.43499999999995, "r_x1": 430.902, "r_y1": 82.43499999999995, "r_x2": 430.902, "r_y2": 73.88300000000004, "r_x3": 412.332, "r_y3": 73.88300000000004, "coord_origin": "TOPLEFT"}, "text": "Tags", "orig": "Tags", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 76, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 442.857, "r_y0": 82.43499999999995, "r_x1": 464.446, "r_y1": 82.43499999999995, "r_x2": 464.446, "r_y2": 73.88300000000004, "r_x3": 442.857, "r_y3": 73.88300000000004, "coord_origin": "TOPLEFT"}, "text": "Bbox", "orig": "Bbox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 77, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 477.786, "r_y0": 82.43499999999995, "r_x1": 494.942, "r_y1": 82.43499999999995, "r_x2": 494.942, "r_y2": 73.88300000000004, "r_x3": 477.786, "r_y3": 73.88300000000004, "coord_origin": "TOPLEFT"}, "text": "Size", "orig": "Size", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 78, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 508.282, "r_y0": 82.43499999999995, "r_x1": 536.914, "r_y1": 82.43499999999995, "r_x2": 536.914, "r_y2": 73.88300000000004, "r_x3": 508.282, "r_y3": 73.88300000000004, "coord_origin": "TOPLEFT"}, "text": "Format", "orig": "Format", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 79, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 317.06, "r_y0": 94.78800000000001, "r_x1": 361.643, "r_y1": 94.78800000000001, "r_x2": 361.643, "r_y2": 86.23599999999999, "r_x3": 317.06, "r_y3": 86.23599999999999, "coord_origin": "TOPLEFT"}, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 80, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 417.856, "r_y0": 92.72199999999998, "r_x1": 425.378, "r_y1": 92.72199999999998, "r_x2": 425.378, "r_y2": 85.668, "r_x3": 417.856, "r_y3": 85.668, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 81, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 449.896, "r_y0": 92.72199999999998, "r_x1": 457.417, "r_y1": 92.72199999999998, "r_x2": 457.417, "r_y2": 85.668, "r_x3": 449.896, "r_y3": 85.668, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 82, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 476.401, "r_y0": 94.78800000000001, "r_x1": 496.326, "r_y1": 94.78800000000001, "r_x2": 496.326, "r_y2": 86.23599999999999, "r_x3": 476.401, "r_y3": 86.23599999999999, "coord_origin": "TOPLEFT"}, "text": "509k", "orig": "509k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 83, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 512.635, "r_y0": 94.78800000000001, "r_x1": 532.56, "r_y1": 94.78800000000001, "r_x2": 532.56, "r_y2": 86.23599999999999, "r_x3": 512.635, "r_y3": 86.23599999999999, "coord_origin": "TOPLEFT"}, "text": "PNG", "orig": "PNG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 84, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 317.06, "r_y0": 106.74300000000005, "r_x1": 359.431, "r_y1": 106.74300000000005, "r_x2": 359.431, "r_y2": 98.19100000000003, "r_x3": 317.06, "r_y3": 98.19100000000003, "coord_origin": "TOPLEFT"}, "text": "FinTabNet", "orig": "FinTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 85, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 417.856, "r_y0": 104.67700000000002, "r_x1": 425.378, "r_y1": 104.67700000000002, "r_x2": 425.378, "r_y2": 97.62300000000005, "r_x3": 417.856, "r_y3": 97.62300000000005, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 86, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 449.896, "r_y0": 104.67700000000002, "r_x1": 457.417, "r_y1": 104.67700000000002, "r_x2": 457.417, "r_y2": 97.62300000000005, "r_x3": 449.896, "r_y3": 97.62300000000005, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 87, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 476.401, "r_y0": 106.74300000000005, "r_x1": 496.326, "r_y1": 106.74300000000005, "r_x2": 496.326, "r_y2": 98.19100000000003, "r_x3": 476.401, "r_y3": 98.19100000000003, "coord_origin": "TOPLEFT"}, "text": "112k", "orig": "112k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 88, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 513.462, "r_y0": 106.74300000000005, "r_x1": 531.733, "r_y1": 106.74300000000005, "r_x2": 531.733, "r_y2": 98.19100000000003, "r_x3": 513.462, "r_y3": 98.19100000000003, "coord_origin": "TOPLEFT"}, "text": "PDF", "orig": "PDF", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 89, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 317.06, "r_y0": 118.69899999999996, "r_x1": 359.979, "r_y1": 118.69899999999996, "r_x2": 359.979, "r_y2": 110.14700000000005, "r_x3": 317.06, "r_y3": 110.14700000000005, "coord_origin": "TOPLEFT"}, "text": "TableBank", "orig": "TableBank", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 90, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 417.856, "r_y0": 116.63300000000004, "r_x1": 425.378, "r_y1": 116.63300000000004, "r_x2": 425.378, "r_y2": 109.57899999999995, "r_x3": 417.856, "r_y3": 109.57899999999995, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 91, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 450.812, "r_y0": 116.63300000000004, "r_x1": 456.501, "r_y1": 116.63300000000004, "r_x2": 456.501, "r_y2": 109.57899999999995, "r_x3": 450.812, "r_y3": 109.57899999999995, "coord_origin": "TOPLEFT"}, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 92, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 476.401, "r_y0": 118.69899999999996, "r_x1": 496.326, "r_y1": 118.69899999999996, "r_x2": 496.326, "r_y2": 110.14700000000005, "r_x3": 476.401, "r_y3": 110.14700000000005, "coord_origin": "TOPLEFT"}, "text": "145k", "orig": "145k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 93, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 511.25, "r_y0": 118.69899999999996, "r_x1": 533.945, "r_y1": 118.69899999999996, "r_x2": 533.945, "r_y2": 110.14700000000005, "r_x3": 511.25, "r_y3": 110.14700000000005, "coord_origin": "TOPLEFT"}, "text": "JPEG", "orig": "JPEG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 94, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 317.06, "r_y0": 130.654, "r_x1": 400.377, "r_y1": 130.654, "r_x2": 400.377, "r_y2": 122.10199999999998, "r_x3": 317.06, "r_y3": 122.10199999999998, "coord_origin": "TOPLEFT"}, "text": "Combined-Tabnet(*)", "orig": "Combined-Tabnet(*)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 95, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 417.856, "r_y0": 128.58799999999997, "r_x1": 425.378, "r_y1": 128.58799999999997, "r_x2": 425.378, "r_y2": 121.53399999999999, "r_x3": 417.856, "r_y3": 121.53399999999999, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 96, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 449.896, "r_y0": 128.58799999999997, "r_x1": 457.417, "r_y1": 128.58799999999997, "r_x2": 457.417, "r_y2": 121.53399999999999, "r_x3": 449.896, "r_y3": 121.53399999999999, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 97, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 476.401, "r_y0": 130.654, "r_x1": 496.326, "r_y1": 130.654, "r_x2": 496.326, "r_y2": 122.10199999999998, "r_x3": 476.401, "r_y3": 122.10199999999998, "coord_origin": "TOPLEFT"}, "text": "400k", "orig": "400k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 98, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 512.635, "r_y0": 130.654, "r_x1": 532.56, "r_y1": 130.654, "r_x2": 532.56, "r_y2": 122.10199999999998, "r_x3": 512.635, "r_y3": 122.10199999999998, "coord_origin": "TOPLEFT"}, "text": "PNG", "orig": "PNG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 99, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 317.06, "r_y0": 142.60900000000004, "r_x1": 375.172, "r_y1": 142.60900000000004, "r_x2": 375.172, "r_y2": 134.05700000000002, "r_x3": 317.06, "r_y3": 134.05700000000002, "coord_origin": "TOPLEFT"}, "text": "Combined(**)", "orig": "Combined(**)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 100, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 417.856, "r_y0": 140.543, "r_x1": 425.378, "r_y1": 140.543, "r_x2": 425.378, "r_y2": 133.48900000000003, "r_x3": 417.856, "r_y3": 133.48900000000003, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 101, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 449.896, "r_y0": 140.543, "r_x1": 457.417, "r_y1": 140.543, "r_x2": 457.417, "r_y2": 133.48900000000003, "r_x3": 449.896, "r_y3": 133.48900000000003, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 102, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 476.401, "r_y0": 142.60900000000004, "r_x1": 496.326, "r_y1": 142.60900000000004, "r_x2": 496.326, "r_y2": 134.05700000000002, "r_x3": 476.401, "r_y3": 134.05700000000002, "coord_origin": "TOPLEFT"}, "text": "500k", "orig": "500k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 103, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 512.635, "r_y0": 142.60900000000004, "r_x1": 532.56, "r_y1": 142.60900000000004, "r_x2": 532.56, "r_y2": 134.05700000000002, "r_x3": 512.635, "r_y3": 134.05700000000002, "coord_origin": "TOPLEFT"}, "text": "PNG", "orig": "PNG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 104, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 317.06, "r_y0": 154.56399999999996, "r_x1": 369.394, "r_y1": 154.56399999999996, "r_x2": 369.394, "r_y2": 146.01199999999994, "r_x3": 317.06, "r_y3": 146.01199999999994, "coord_origin": "TOPLEFT"}, "text": "SynthTabNet", "orig": "SynthTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 105, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 417.856, "r_y0": 152.49800000000005, "r_x1": 425.378, "r_y1": 152.49800000000005, "r_x2": 425.378, "r_y2": 145.44399999999996, "r_x3": 417.856, "r_y3": 145.44399999999996, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 106, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 449.896, "r_y0": 152.49800000000005, "r_x1": 457.417, "r_y1": 152.49800000000005, "r_x2": 457.417, "r_y2": 145.44399999999996, "r_x3": 449.896, "r_y3": 145.44399999999996, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 107, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 476.401, "r_y0": 154.56399999999996, "r_x1": 496.326, "r_y1": 154.56399999999996, "r_x2": 496.326, "r_y2": 146.01199999999994, "r_x3": 476.401, "r_y3": 146.01199999999994, "coord_origin": "TOPLEFT"}, "text": "600k", "orig": "600k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 108, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 512.635, "r_y0": 154.56399999999996, "r_x1": 532.56, "r_y1": 154.56399999999996, "r_x2": 532.56, "r_y2": 146.01199999999994, "r_x3": 512.635, "r_y3": 146.01199999999994, "coord_origin": "TOPLEFT"}, "text": "PNG", "orig": "PNG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": [{"id": 17, "label": "text", "bbox": {"l": 412.332, "t": 73.88300000000004, "r": 430.902, "b": 82.43499999999995, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 75, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 412.332, "r_y0": 82.43499999999995, "r_x1": 430.902, "r_y1": 82.43499999999995, "r_x2": 430.902, "r_y2": 73.88300000000004, "r_x3": 412.332, "r_y3": 73.88300000000004, "coord_origin": "TOPLEFT"}, "text": "Tags", "orig": "Tags", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 18, "label": "text", "bbox": {"l": 442.857, "t": 73.88300000000004, "r": 464.446, "b": 82.43499999999995, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 76, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 442.857, "r_y0": 82.43499999999995, "r_x1": 464.446, "r_y1": 82.43499999999995, "r_x2": 464.446, "r_y2": 73.88300000000004, "r_x3": 442.857, "r_y3": 73.88300000000004, "coord_origin": "TOPLEFT"}, "text": "Bbox", "orig": "Bbox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 19, "label": "text", "bbox": {"l": 477.786, "t": 73.88300000000004, "r": 494.942, "b": 82.43499999999995, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 77, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 477.786, "r_y0": 82.43499999999995, "r_x1": 494.942, "r_y1": 82.43499999999995, "r_x2": 494.942, "r_y2": 73.88300000000004, "r_x3": 477.786, "r_y3": 73.88300000000004, "coord_origin": "TOPLEFT"}, "text": "Size", "orig": "Size", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 20, "label": "text", "bbox": {"l": 508.282, "t": 73.88300000000004, "r": 536.914, "b": 82.43499999999995, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 78, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 508.282, "r_y0": 82.43499999999995, "r_x1": 536.914, "r_y1": 82.43499999999995, "r_x2": 536.914, "r_y2": 73.88300000000004, "r_x3": 508.282, "r_y3": 73.88300000000004, "coord_origin": "TOPLEFT"}, "text": "Format", "orig": "Format", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 21, "label": "text", "bbox": {"l": 317.06, "t": 86.23599999999999, "r": 361.643, "b": 94.78800000000001, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 79, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 317.06, "r_y0": 94.78800000000001, "r_x1": 361.643, "r_y1": 94.78800000000001, "r_x2": 361.643, "r_y2": 86.23599999999999, "r_x3": 317.06, "r_y3": 86.23599999999999, "coord_origin": "TOPLEFT"}, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 22, "label": "text", "bbox": {"l": 417.856, "t": 85.668, "r": 425.378, "b": 92.72199999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 80, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 417.856, "r_y0": 92.72199999999998, "r_x1": 425.378, "r_y1": 92.72199999999998, "r_x2": 425.378, "r_y2": 85.668, "r_x3": 417.856, "r_y3": 85.668, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 23, "label": "text", "bbox": {"l": 449.896, "t": 85.668, "r": 457.417, "b": 92.72199999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 81, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 449.896, "r_y0": 92.72199999999998, "r_x1": 457.417, "r_y1": 92.72199999999998, "r_x2": 457.417, "r_y2": 85.668, "r_x3": 449.896, "r_y3": 85.668, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 24, "label": "text", "bbox": {"l": 476.401, "t": 86.23599999999999, "r": 496.326, "b": 94.78800000000001, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 82, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 476.401, "r_y0": 94.78800000000001, "r_x1": 496.326, "r_y1": 94.78800000000001, "r_x2": 496.326, "r_y2": 86.23599999999999, "r_x3": 476.401, "r_y3": 86.23599999999999, "coord_origin": "TOPLEFT"}, "text": "509k", "orig": "509k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 25, "label": "text", "bbox": {"l": 512.635, "t": 86.23599999999999, "r": 532.56, "b": 94.78800000000001, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 83, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 512.635, "r_y0": 94.78800000000001, "r_x1": 532.56, "r_y1": 94.78800000000001, "r_x2": 532.56, "r_y2": 86.23599999999999, "r_x3": 512.635, "r_y3": 86.23599999999999, "coord_origin": "TOPLEFT"}, "text": "PNG", "orig": "PNG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 26, "label": "text", "bbox": {"l": 317.06, "t": 98.19100000000003, "r": 359.431, "b": 106.74300000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 84, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 317.06, "r_y0": 106.74300000000005, "r_x1": 359.431, "r_y1": 106.74300000000005, "r_x2": 359.431, "r_y2": 98.19100000000003, "r_x3": 317.06, "r_y3": 98.19100000000003, "coord_origin": "TOPLEFT"}, "text": "FinTabNet", "orig": "FinTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 27, "label": "text", "bbox": {"l": 417.856, "t": 97.62300000000005, "r": 425.378, "b": 104.67700000000002, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 85, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 417.856, "r_y0": 104.67700000000002, "r_x1": 425.378, "r_y1": 104.67700000000002, "r_x2": 425.378, "r_y2": 97.62300000000005, "r_x3": 417.856, "r_y3": 97.62300000000005, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 28, "label": "text", "bbox": {"l": 449.896, "t": 97.62300000000005, "r": 457.417, "b": 104.67700000000002, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 86, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 449.896, "r_y0": 104.67700000000002, "r_x1": 457.417, "r_y1": 104.67700000000002, "r_x2": 457.417, "r_y2": 97.62300000000005, "r_x3": 449.896, "r_y3": 97.62300000000005, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 29, "label": "text", "bbox": {"l": 476.401, "t": 98.19100000000003, "r": 496.326, "b": 106.74300000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 87, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 476.401, "r_y0": 106.74300000000005, "r_x1": 496.326, "r_y1": 106.74300000000005, "r_x2": 496.326, "r_y2": 98.19100000000003, "r_x3": 476.401, "r_y3": 98.19100000000003, "coord_origin": "TOPLEFT"}, "text": "112k", "orig": "112k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 30, "label": "text", "bbox": {"l": 513.462, "t": 98.19100000000003, "r": 531.733, "b": 106.74300000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 88, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 513.462, "r_y0": 106.74300000000005, "r_x1": 531.733, "r_y1": 106.74300000000005, "r_x2": 531.733, "r_y2": 98.19100000000003, "r_x3": 513.462, "r_y3": 98.19100000000003, "coord_origin": "TOPLEFT"}, "text": "PDF", "orig": "PDF", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 31, "label": "text", "bbox": {"l": 317.06, "t": 110.14700000000005, "r": 359.979, "b": 118.69899999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 89, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 317.06, "r_y0": 118.69899999999996, "r_x1": 359.979, "r_y1": 118.69899999999996, "r_x2": 359.979, "r_y2": 110.14700000000005, "r_x3": 317.06, "r_y3": 110.14700000000005, "coord_origin": "TOPLEFT"}, "text": "TableBank", "orig": "TableBank", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 32, "label": "text", "bbox": {"l": 417.856, "t": 109.57899999999995, "r": 425.378, "b": 116.63300000000004, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 90, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 417.856, "r_y0": 116.63300000000004, "r_x1": 425.378, "r_y1": 116.63300000000004, "r_x2": 425.378, "r_y2": 109.57899999999995, "r_x3": 417.856, "r_y3": 109.57899999999995, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 33, "label": "text", "bbox": {"l": 450.812, "t": 109.57899999999995, "r": 456.501, "b": 116.63300000000004, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 91, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 450.812, "r_y0": 116.63300000000004, "r_x1": 456.501, "r_y1": 116.63300000000004, "r_x2": 456.501, "r_y2": 109.57899999999995, "r_x3": 450.812, "r_y3": 109.57899999999995, "coord_origin": "TOPLEFT"}, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 34, "label": "text", "bbox": {"l": 476.401, "t": 110.14700000000005, "r": 496.326, "b": 118.69899999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 92, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 476.401, "r_y0": 118.69899999999996, "r_x1": 496.326, "r_y1": 118.69899999999996, "r_x2": 496.326, "r_y2": 110.14700000000005, "r_x3": 476.401, "r_y3": 110.14700000000005, "coord_origin": "TOPLEFT"}, "text": "145k", "orig": "145k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 35, "label": "text", "bbox": {"l": 511.25, "t": 110.14700000000005, "r": 533.945, "b": 118.69899999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 93, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 511.25, "r_y0": 118.69899999999996, "r_x1": 533.945, "r_y1": 118.69899999999996, "r_x2": 533.945, "r_y2": 110.14700000000005, "r_x3": 511.25, "r_y3": 110.14700000000005, "coord_origin": "TOPLEFT"}, "text": "JPEG", "orig": "JPEG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 36, "label": "text", "bbox": {"l": 317.06, "t": 122.10199999999998, "r": 400.377, "b": 130.654, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 94, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 317.06, "r_y0": 130.654, "r_x1": 400.377, "r_y1": 130.654, "r_x2": 400.377, "r_y2": 122.10199999999998, "r_x3": 317.06, "r_y3": 122.10199999999998, "coord_origin": "TOPLEFT"}, "text": "Combined-Tabnet(*)", "orig": "Combined-Tabnet(*)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 37, "label": "text", "bbox": {"l": 417.856, "t": 121.53399999999999, "r": 425.378, "b": 128.58799999999997, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 95, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 417.856, "r_y0": 128.58799999999997, "r_x1": 425.378, "r_y1": 128.58799999999997, "r_x2": 425.378, "r_y2": 121.53399999999999, "r_x3": 417.856, "r_y3": 121.53399999999999, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 38, "label": "text", "bbox": {"l": 449.896, "t": 121.53399999999999, "r": 457.417, "b": 128.58799999999997, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 96, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 449.896, "r_y0": 128.58799999999997, "r_x1": 457.417, "r_y1": 128.58799999999997, "r_x2": 457.417, "r_y2": 121.53399999999999, "r_x3": 449.896, "r_y3": 121.53399999999999, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 39, "label": "text", "bbox": {"l": 476.401, "t": 122.10199999999998, "r": 496.326, "b": 130.654, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 97, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 476.401, "r_y0": 130.654, "r_x1": 496.326, "r_y1": 130.654, "r_x2": 496.326, "r_y2": 122.10199999999998, "r_x3": 476.401, "r_y3": 122.10199999999998, "coord_origin": "TOPLEFT"}, "text": "400k", "orig": "400k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 40, "label": "text", "bbox": {"l": 512.635, "t": 122.10199999999998, "r": 532.56, "b": 130.654, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 98, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 512.635, "r_y0": 130.654, "r_x1": 532.56, "r_y1": 130.654, "r_x2": 532.56, "r_y2": 122.10199999999998, "r_x3": 512.635, "r_y3": 122.10199999999998, "coord_origin": "TOPLEFT"}, "text": "PNG", "orig": "PNG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 41, "label": "text", "bbox": {"l": 317.06, "t": 134.05700000000002, "r": 375.172, "b": 142.60900000000004, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 99, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 317.06, "r_y0": 142.60900000000004, "r_x1": 375.172, "r_y1": 142.60900000000004, "r_x2": 375.172, "r_y2": 134.05700000000002, "r_x3": 317.06, "r_y3": 134.05700000000002, "coord_origin": "TOPLEFT"}, "text": "Combined(**)", "orig": "Combined(**)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 42, "label": "text", "bbox": {"l": 417.856, "t": 133.48900000000003, "r": 425.378, "b": 140.543, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 100, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 417.856, "r_y0": 140.543, "r_x1": 425.378, "r_y1": 140.543, "r_x2": 425.378, "r_y2": 133.48900000000003, "r_x3": 417.856, "r_y3": 133.48900000000003, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 43, "label": "text", "bbox": {"l": 449.896, "t": 133.48900000000003, "r": 457.417, "b": 140.543, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 101, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 449.896, "r_y0": 140.543, "r_x1": 457.417, "r_y1": 140.543, "r_x2": 457.417, "r_y2": 133.48900000000003, "r_x3": 449.896, "r_y3": 133.48900000000003, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 44, "label": "text", "bbox": {"l": 476.401, "t": 134.05700000000002, "r": 496.326, "b": 142.60900000000004, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 102, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 476.401, "r_y0": 142.60900000000004, "r_x1": 496.326, "r_y1": 142.60900000000004, "r_x2": 496.326, "r_y2": 134.05700000000002, "r_x3": 476.401, "r_y3": 134.05700000000002, "coord_origin": "TOPLEFT"}, "text": "500k", "orig": "500k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 45, "label": "text", "bbox": {"l": 512.635, "t": 134.05700000000002, "r": 532.56, "b": 142.60900000000004, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 103, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 512.635, "r_y0": 142.60900000000004, "r_x1": 532.56, "r_y1": 142.60900000000004, "r_x2": 532.56, "r_y2": 134.05700000000002, "r_x3": 512.635, "r_y3": 134.05700000000002, "coord_origin": "TOPLEFT"}, "text": "PNG", "orig": "PNG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 46, "label": "text", "bbox": {"l": 317.06, "t": 146.01199999999994, "r": 369.394, "b": 154.56399999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 104, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 317.06, "r_y0": 154.56399999999996, "r_x1": 369.394, "r_y1": 154.56399999999996, "r_x2": 369.394, "r_y2": 146.01199999999994, "r_x3": 317.06, "r_y3": 146.01199999999994, "coord_origin": "TOPLEFT"}, "text": "SynthTabNet", "orig": "SynthTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 47, "label": "text", "bbox": {"l": 417.856, "t": 145.44399999999996, "r": 425.378, "b": 152.49800000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 105, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 417.856, "r_y0": 152.49800000000005, "r_x1": 425.378, "r_y1": 152.49800000000005, "r_x2": 425.378, "r_y2": 145.44399999999996, "r_x3": 417.856, "r_y3": 145.44399999999996, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 48, "label": "text", "bbox": {"l": 449.896, "t": 145.44399999999996, "r": 457.417, "b": 152.49800000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 106, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 449.896, "r_y0": 152.49800000000005, "r_x1": 457.417, "r_y1": 152.49800000000005, "r_x2": 457.417, "r_y2": 145.44399999999996, "r_x3": 449.896, "r_y3": 145.44399999999996, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 49, "label": "text", "bbox": {"l": 476.401, "t": 146.01199999999994, "r": 496.326, "b": 154.56399999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 107, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 476.401, "r_y0": 154.56399999999996, "r_x1": 496.326, "r_y1": 154.56399999999996, "r_x2": 496.326, "r_y2": 146.01199999999994, "r_x3": 476.401, "r_y3": 146.01199999999994, "coord_origin": "TOPLEFT"}, "text": "600k", "orig": "600k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 50, "label": "text", "bbox": {"l": 512.635, "t": 146.01199999999994, "r": 532.56, "b": 154.56399999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 108, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 512.635, "r_y0": 154.56399999999996, "r_x1": 532.56, "r_y1": 154.56399999999996, "r_x2": 532.56, "r_y2": 146.01199999999994, "r_x3": 512.635, "r_y3": 146.01199999999994, "coord_origin": "TOPLEFT"}, "text": "PNG", "orig": "PNG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}]}, "text": null, "otsl_seq": ["ecel", "ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 7, "num_cols": 5, "table_cells": [{"bbox": {"l": 412.332, "t": 73.88300000000004, "r": 430.902, "b": 82.43499999999995, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "Tags", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 442.857, "t": 73.88300000000004, "r": 464.446, "b": 82.43499999999995, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "Bbox", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 477.786, "t": 73.88300000000004, "r": 494.942, "b": 82.43499999999995, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "Size", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 508.282, "t": 73.88300000000004, "r": 536.914, "b": 82.43499999999995, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "Format", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 317.06, "t": 86.23599999999999, "r": 361.643, "b": 94.78800000000001, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "PubTabNet", "column_header": false, "row_header": true, "row_section": false}, {"bbox": {"l": 417.856, "t": 85.668, "r": 425.378, "b": 92.72199999999998, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "3", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 449.896, "t": 85.668, "r": 457.417, "b": 92.72199999999998, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "3", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 476.401, "t": 86.23599999999999, "r": 496.326, "b": 94.78800000000001, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "509k", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 512.635, "t": 86.23599999999999, "r": 532.56, "b": 94.78800000000001, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "PNG", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 317.06, "t": 98.19100000000003, "r": 359.431, "b": 106.74300000000005, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "FinTabNet", "column_header": false, "row_header": true, "row_section": false}, {"bbox": {"l": 417.856, "t": 97.62300000000005, "r": 425.378, "b": 104.67700000000002, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "3", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 449.896, "t": 97.62300000000005, "r": 457.417, "b": 104.67700000000002, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "3", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 476.401, "t": 98.19100000000003, "r": 496.326, "b": 106.74300000000005, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "112k", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 513.462, "t": 98.19100000000003, "r": 531.733, "b": 106.74300000000005, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "PDF", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 317.06, "t": 110.14700000000005, "r": 359.979, "b": 118.69899999999996, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "TableBank", "column_header": false, "row_header": true, "row_section": false}, {"bbox": {"l": 417.856, "t": 109.57899999999995, "r": 425.378, "b": 116.63300000000004, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "3", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 450.812, "t": 109.57899999999995, "r": 456.501, "b": 116.63300000000004, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "7", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 476.401, "t": 110.14700000000005, "r": 496.326, "b": 118.69899999999996, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "145k", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 511.25, "t": 110.14700000000005, "r": 533.945, "b": 118.69899999999996, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "JPEG", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 317.06, "t": 122.10199999999998, "r": 400.377, "b": 130.654, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Combined-Tabnet(*)", "column_header": false, "row_header": true, "row_section": false}, {"bbox": {"l": 417.856, "t": 121.53399999999999, "r": 425.378, "b": 128.58799999999997, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "3", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 449.896, "t": 121.53399999999999, "r": 457.417, "b": 128.58799999999997, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "3", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 476.401, "t": 122.10199999999998, "r": 496.326, "b": 130.654, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "400k", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 512.635, "t": 122.10199999999998, "r": 532.56, "b": 130.654, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "PNG", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 317.06, "t": 134.05700000000002, "r": 375.172, "b": 142.60900000000004, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Combined(**)", "column_header": false, "row_header": true, "row_section": false}, {"bbox": {"l": 417.856, "t": 133.48900000000003, "r": 425.378, "b": 140.543, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "3", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 449.896, "t": 133.48900000000003, "r": 457.417, "b": 140.543, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "3", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 476.401, "t": 134.05700000000002, "r": 496.326, "b": 142.60900000000004, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "500k", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 512.635, "t": 134.05700000000002, "r": 532.56, "b": 142.60900000000004, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "PNG", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 317.06, "t": 146.01199999999994, "r": 369.394, "b": 154.56399999999996, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "SynthTabNet", "column_header": false, "row_header": true, "row_section": false}, {"bbox": {"l": 417.856, "t": 145.44399999999996, "r": 425.378, "b": 152.49800000000005, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "3", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 449.896, "t": 145.44399999999996, "r": 457.417, "b": 152.49800000000005, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "3", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 476.401, "t": 146.01199999999994, "r": 496.326, "b": 154.56399999999996, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "600k", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 512.635, "t": 146.01199999999994, "r": 532.56, "b": 154.56399999999996, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "PNG", "column_header": false, "row_header": false, "row_section": false}]}}}, "figures_classification": null, "equations_prediction": null, "vlm_response": null}, "assembled": {"elements": [{"label": "text", "id": 10, "page_no": 3, "cluster": {"id": 10, "label": "text", "bbox": {"l": 50.112, "t": 75.47699999999998, "r": 286.365, "b": 95.98400000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.9611433148384094, "cells": [{"index": 0, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 84.029, "r_x1": 286.365, "r_y1": 84.029, "r_x2": 286.365, "r_y2": 75.47699999999998, "r_x3": 50.112, "r_y3": 75.47699999999998, "coord_origin": "TOPLEFT"}, "text": "amount of such tables, and kept only those ones ranging", "orig": "amount of such tables, and kept only those ones ranging", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 95.98400000000004, "r_x1": 212.283, "r_y1": 95.98400000000004, "r_x2": 212.283, "r_y2": 87.43200000000002, "r_x3": 50.112, "r_y3": 87.43200000000002, "coord_origin": "TOPLEFT"}, "text": "between 1*1 and 20*10 (rows/columns).", "orig": "between 1*1 and 20*10 (rows/columns).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "amount of such tables, and kept only those ones ranging between 1*1 and 20*10 (rows/columns)."}, {"label": "text", "id": 1, "page_no": 3, "cluster": {"id": 1, "label": "text", "bbox": {"l": 50.112, "t": 101.22900000000004, "r": 286.365, "b": 313.019, "coord_origin": "TOPLEFT"}, "confidence": 0.988013744354248, "cells": [{"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 109.78099999999995, "r_x1": 286.365, "r_y1": 109.78099999999995, "r_x2": 286.365, "r_y2": 101.22900000000004, "r_x3": 62.067, "r_y3": 101.22900000000004, "coord_origin": "TOPLEFT"}, "text": "The availability of the bounding boxes for all table cells", "orig": "The availability of the bounding boxes for all table cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 121.73599999999999, "r_x1": 176.458, "r_y1": 121.73599999999999, "r_x2": 176.458, "r_y2": 113.18399999999997, "r_x3": 50.112, "r_y3": 113.18399999999997, "coord_origin": "TOPLEFT"}, "text": "is essential to train our models.", "orig": "is essential to train our models.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 180.971, "r_y0": 121.73599999999999, "r_x1": 286.365, "r_y1": 121.73599999999999, "r_x2": 286.365, "r_y2": 113.18399999999997, "r_x3": 180.971, "r_y3": 113.18399999999997, "coord_origin": "TOPLEFT"}, "text": "In order to distinguish be-", "orig": "In order to distinguish be-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 133.69100000000003, "r_x1": 286.365, "r_y1": 133.69100000000003, "r_x2": 286.365, "r_y2": 125.13900000000001, "r_x3": 50.112, "r_y3": 125.13900000000001, "coord_origin": "TOPLEFT"}, "text": "tween empty and non-empty bounding boxes, we have in-", "orig": "tween empty and non-empty bounding boxes, we have in-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 145.64700000000005, "r_x1": 286.365, "r_y1": 145.64700000000005, "r_x2": 286.365, "r_y2": 137.09500000000003, "r_x3": 50.112, "r_y3": 137.09500000000003, "coord_origin": "TOPLEFT"}, "text": "troduced a binary class in the annotation. Unfortunately, the", "orig": "troduced a binary class in the annotation. Unfortunately, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 157.60199999999998, "r_x1": 286.365, "r_y1": 157.60199999999998, "r_x2": 286.365, "r_y2": 149.04999999999995, "r_x3": 50.112, "r_y3": 149.04999999999995, "coord_origin": "TOPLEFT"}, "text": "original datasets either omit the bounding boxes for whole", "orig": "original datasets either omit the bounding boxes for whole", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 169.55700000000002, "r_x1": 94.127, "r_y1": 169.55700000000002, "r_x2": 94.127, "r_y2": 161.005, "r_x3": 50.112, "r_y3": 161.005, "coord_origin": "TOPLEFT"}, "text": "tables (e.g.", "orig": "tables (e.g.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 98.959, "r_y0": 169.55700000000002, "r_x1": 286.365, "r_y1": 169.55700000000002, "r_x2": 286.365, "r_y2": 161.005, "r_x3": 98.959, "r_y3": 161.005, "coord_origin": "TOPLEFT"}, "text": "TableBank) or they narrow their scope only to", "orig": "TableBank) or they narrow their scope only to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 181.51199999999994, "r_x1": 116.951, "r_y1": 181.51199999999994, "r_x2": 116.951, "r_y2": 172.96000000000004, "r_x3": 50.112, "r_y3": 172.96000000000004, "coord_origin": "TOPLEFT"}, "text": "non-empty cells.", "orig": "non-empty cells.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 121.345, "r_y0": 181.51199999999994, "r_x1": 286.365, "r_y1": 181.51199999999994, "r_x2": 286.365, "r_y2": 172.96000000000004, "r_x3": 121.345, "r_y3": 172.96000000000004, "coord_origin": "TOPLEFT"}, "text": "Therefore, it was imperative to introduce", "orig": "Therefore, it was imperative to introduce", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 193.46699999999998, "r_x1": 286.365, "r_y1": 193.46699999999998, "r_x2": 286.365, "r_y2": 184.91499999999996, "r_x3": 50.112, "r_y3": 184.91499999999996, "coord_origin": "TOPLEFT"}, "text": "a data pre-processing procedure that generates the missing", "orig": "a data pre-processing procedure that generates the missing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 205.423, "r_x1": 286.365, "r_y1": 205.423, "r_x2": 286.365, "r_y2": 196.87099999999998, "r_x3": 50.112, "r_y3": 196.87099999999998, "coord_origin": "TOPLEFT"}, "text": "bounding boxes out of the annotation information. This pro-", "orig": "bounding boxes out of the annotation information. This pro-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 217.37800000000004, "r_x1": 286.365, "r_y1": 217.37800000000004, "r_x2": 286.365, "r_y2": 208.82600000000002, "r_x3": 50.112, "r_y3": 208.82600000000002, "coord_origin": "TOPLEFT"}, "text": "cedure first parses the provided table structure and calcu-", "orig": "cedure first parses the provided table structure and calcu-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 229.33299999999997, "r_x1": 286.365, "r_y1": 229.33299999999997, "r_x2": 286.365, "r_y2": 220.78099999999995, "r_x3": 50.112, "r_y3": 220.78099999999995, "coord_origin": "TOPLEFT"}, "text": "lates the dimensions of the most fine-grained grid that cov-", "orig": "lates the dimensions of the most fine-grained grid that cov-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 241.288, "r_x1": 139.805, "r_y1": 241.288, "r_x2": 139.805, "r_y2": 232.736, "r_x3": 50.112, "r_y3": 232.736, "coord_origin": "TOPLEFT"}, "text": "ers the table structure.", "orig": "ers the table structure.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 144.607, "r_y0": 241.288, "r_x1": 286.365, "r_y1": 241.288, "r_x2": 286.365, "r_y2": 232.736, "r_x3": 144.607, "r_y3": 232.736, "coord_origin": "TOPLEFT"}, "text": "Notice that each table cell may oc-", "orig": "Notice that each table cell may oc-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 253.24300000000005, "r_x1": 286.365, "r_y1": 253.24300000000005, "r_x2": 286.365, "r_y2": 244.69100000000003, "r_x3": 50.112, "r_y3": 244.69100000000003, "coord_origin": "TOPLEFT"}, "text": "cupy multiple grid squares due to row or column spans. In", "orig": "cupy multiple grid squares due to row or column spans. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 19, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 265.198, "r_x1": 286.365, "r_y1": 265.198, "r_x2": 286.365, "r_y2": 256.64599999999996, "r_x3": 50.112, "r_y3": 256.64599999999996, "coord_origin": "TOPLEFT"}, "text": "case of PubTabNet we had to compute missing bounding", "orig": "case of PubTabNet we had to compute missing bounding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 20, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 277.154, "r_x1": 286.365, "r_y1": 277.154, "r_x2": 286.365, "r_y2": 268.602, "r_x3": 50.112, "r_y3": 268.602, "coord_origin": "TOPLEFT"}, "text": "boxes for 48% of the simple and 69% of the complex ta-", "orig": "boxes for 48% of the simple and 69% of the complex ta-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 21, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 289.109, "r_x1": 68.652, "r_y1": 289.109, "r_x2": 68.652, "r_y2": 280.557, "r_x3": 50.112, "r_y3": 280.557, "coord_origin": "TOPLEFT"}, "text": "bles.", "orig": "bles.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 22, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 75.566, "r_y0": 289.109, "r_x1": 286.365, "r_y1": 289.109, "r_x2": 286.365, "r_y2": 280.557, "r_x3": 75.566, "r_y3": 280.557, "coord_origin": "TOPLEFT"}, "text": "Regarding FinTabNet, 68% of the simple and 98%", "orig": "Regarding FinTabNet, 68% of the simple and 98%", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 23, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 301.064, "r_x1": 286.365, "r_y1": 301.064, "r_x2": 286.365, "r_y2": 292.512, "r_x3": 50.112, "r_y3": 292.512, "coord_origin": "TOPLEFT"}, "text": "of the complex tables require the generation of bounding", "orig": "of the complex tables require the generation of bounding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 24, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 313.019, "r_x1": 75.696, "r_y1": 313.019, "r_x2": 75.696, "r_y2": 304.467, "r_x3": 50.112, "r_y3": 304.467, "coord_origin": "TOPLEFT"}, "text": "boxes.", "orig": "boxes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "The availability of the bounding boxes for all table cells is essential to train our models. In order to distinguish between empty and non-empty bounding boxes, we have introduced a binary class in the annotation. Unfortunately, the original datasets either omit the bounding boxes for whole tables (e.g. TableBank) or they narrow their scope only to non-empty cells. Therefore, it was imperative to introduce a data pre-processing procedure that generates the missing bounding boxes out of the annotation information. This procedure first parses the provided table structure and calculates the dimensions of the most fine-grained grid that covers the table structure. Notice that each table cell may occupy multiple grid squares due to row or column spans. In case of PubTabNet we had to compute missing bounding boxes for 48% of the simple and 69% of the complex tables. Regarding FinTabNet, 68% of the simple and 98% of the complex tables require the generation of bounding boxes."}, {"label": "text", "id": 4, "page_no": 3, "cluster": {"id": 4, "label": "text", "bbox": {"l": 50.112, "t": 318.264, "r": 286.365, "b": 434.413, "coord_origin": "TOPLEFT"}, "confidence": 0.9873981475830078, "cells": [{"index": 25, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 326.816, "r_x1": 286.365, "r_y1": 326.816, "r_x2": 286.365, "r_y2": 318.264, "r_x3": 62.067, "r_y3": 318.264, "coord_origin": "TOPLEFT"}, "text": "As it is illustrated in Fig. 2, the table distributions from", "orig": "As it is illustrated in Fig. 2, the table distributions from", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 26, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 338.772, "r_x1": 60.075, "r_y1": 338.772, "r_x2": 60.075, "r_y2": 330.22, "r_x3": 50.112, "r_y3": 330.22, "coord_origin": "TOPLEFT"}, "text": "all", "orig": "all", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 27, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 65.146, "r_y0": 338.772, "r_x1": 96.687, "r_y1": 338.772, "r_x2": 96.687, "r_y2": 330.22, "r_x3": 65.146, "r_y3": 330.22, "coord_origin": "TOPLEFT"}, "text": "datasets", "orig": "datasets", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 28, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 101.768, "r_y0": 338.772, "r_x1": 113.932, "r_y1": 338.772, "r_x2": 113.932, "r_y2": 330.22, "r_x3": 101.768, "r_y3": 330.22, "coord_origin": "TOPLEFT"}, "text": "are", "orig": "are", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 29, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 119.003, "r_y0": 338.772, "r_x1": 148.533, "r_y1": 338.772, "r_x2": 148.533, "r_y2": 330.22, "r_x3": 119.003, "r_y3": 330.22, "coord_origin": "TOPLEFT"}, "text": "skewed", "orig": "skewed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 30, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 153.613, "r_y0": 338.772, "r_x1": 184.806, "r_y1": 338.772, "r_x2": 184.806, "r_y2": 330.22, "r_x3": 153.613, "r_y3": 330.22, "coord_origin": "TOPLEFT"}, "text": "towards", "orig": "towards", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 189.877, "r_y0": 338.772, "r_x1": 219.765, "r_y1": 338.772, "r_x2": 219.765, "r_y2": 330.22, "r_x3": 189.877, "r_y3": 330.22, "coord_origin": "TOPLEFT"}, "text": "simpler", "orig": "simpler", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 224.836, "r_y0": 338.772, "r_x1": 263.571, "r_y1": 338.772, "r_x2": 263.571, "r_y2": 330.22, "r_x3": 224.836, "r_y3": 330.22, "coord_origin": "TOPLEFT"}, "text": "structures", "orig": "structures", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 268.652, "r_y0": 338.772, "r_x1": 286.365, "r_y1": 338.772, "r_x2": 286.365, "r_y2": 330.22, "r_x3": 268.652, "r_y3": 330.22, "coord_origin": "TOPLEFT"}, "text": "with", "orig": "with", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 350.727, "r_x1": 286.365, "r_y1": 350.727, "r_x2": 286.365, "r_y2": 342.175, "r_x3": 50.112, "r_y3": 342.175, "coord_origin": "TOPLEFT"}, "text": "fewer number of rows/columns. Additionally, there is very", "orig": "fewer number of rows/columns. Additionally, there is very", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 362.682, "r_x1": 286.365, "r_y1": 362.682, "r_x2": 286.365, "r_y2": 354.13, "r_x3": 50.112, "r_y3": 354.13, "coord_origin": "TOPLEFT"}, "text": "limited variance in the table styles, which in case of Pub-", "orig": "limited variance in the table styles, which in case of Pub-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 374.637, "r_x1": 286.365, "r_y1": 374.637, "r_x2": 286.365, "r_y2": 366.085, "r_x3": 50.112, "r_y3": 366.085, "coord_origin": "TOPLEFT"}, "text": "TabNet and FinTabNet means one styling format for the", "orig": "TabNet and FinTabNet means one styling format for the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 386.592, "r_x1": 141.589, "r_y1": 386.592, "r_x2": 141.589, "r_y2": 378.04, "r_x3": 50.112, "r_y3": 378.04, "coord_origin": "TOPLEFT"}, "text": "majority of the tables.", "orig": "majority of the tables.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 148.702, "r_y0": 386.592, "r_x1": 286.365, "r_y1": 386.592, "r_x2": 286.365, "r_y2": 378.04, "r_x3": 148.702, "r_y3": 378.04, "coord_origin": "TOPLEFT"}, "text": "Similar limitations appear also in", "orig": "Similar limitations appear also in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 398.547, "r_x1": 286.365, "r_y1": 398.547, "r_x2": 286.365, "r_y2": 389.995, "r_x3": 50.112, "r_y3": 389.995, "coord_origin": "TOPLEFT"}, "text": "the type of table content, which in some cases (e.g. FinTab-", "orig": "the type of table content, which in some cases (e.g. FinTab-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 410.503, "r_x1": 201.822, "r_y1": 410.503, "r_x2": 201.822, "r_y2": 401.951, "r_x3": 50.112, "r_y3": 401.951, "coord_origin": "TOPLEFT"}, "text": "Net) is restricted to a certain domain.", "orig": "Net) is restricted to a certain domain.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 206.764, "r_y0": 410.503, "r_x1": 286.365, "r_y1": 410.503, "r_x2": 286.365, "r_y2": 401.951, "r_x3": 206.764, "r_y3": 401.951, "coord_origin": "TOPLEFT"}, "text": "Ultimately, the lack", "orig": "Ultimately, the lack", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 422.458, "r_x1": 286.365, "r_y1": 422.458, "r_x2": 286.365, "r_y2": 413.906, "r_x3": 50.112, "r_y3": 413.906, "coord_origin": "TOPLEFT"}, "text": "of diversity in the training dataset damages the ability of the", "orig": "of diversity in the training dataset damages the ability of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 434.413, "r_x1": 216.398, "r_y1": 434.413, "r_x2": 216.398, "r_y2": 425.861, "r_x3": 50.112, "r_y3": 425.861, "coord_origin": "TOPLEFT"}, "text": "models to generalize well on unseen data.", "orig": "models to generalize well on unseen data.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "As it is illustrated in Fig. 2, the table distributions from all datasets are skewed towards simpler structures with fewer number of rows/columns. Additionally, there is very limited variance in the table styles, which in case of PubTabNet and FinTabNet means one styling format for the majority of the tables. Similar limitations appear also in the type of table content, which in some cases (e.g. FinTabNet) is restricted to a certain domain. Ultimately, the lack of diversity in the training dataset damages the ability of the models to generalize well on unseen data."}, {"label": "text", "id": 3, "page_no": 3, "cluster": {"id": 3, "label": "text", "bbox": {"l": 50.112, "t": 439.658, "r": 286.367, "b": 627.538, "coord_origin": "TOPLEFT"}, "confidence": 0.9876030087471008, "cells": [{"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 448.21, "r_x1": 286.365, "r_y1": 448.21, "r_x2": 286.365, "r_y2": 439.658, "r_x3": 62.067, "r_y3": 439.658, "coord_origin": "TOPLEFT"}, "text": "Motivated by those observations we aimed at generating", "orig": "Motivated by those observations we aimed at generating", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 460.165, "r_x1": 172.144, "r_y1": 460.165, "r_x2": 172.144, "r_y2": 451.613, "r_x3": 50.112, "r_y3": 451.613, "coord_origin": "TOPLEFT"}, "text": "a synthetic table dataset named", "orig": "a synthetic table dataset named", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 174.148, "r_y0": 460.022, "r_x1": 224.708, "r_y1": 460.022, "r_x2": 224.708, "r_y2": 451.434, "r_x3": 174.148, "r_y3": 451.434, "coord_origin": "TOPLEFT"}, "text": "SynthTabNet", "orig": "SynthTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 224.708, "r_y0": 460.165, "r_x1": 227.199, "r_y1": 460.165, "r_x2": 227.199, "r_y2": 451.613, "r_x3": 224.708, "r_y3": 451.613, "coord_origin": "TOPLEFT"}, "text": ".", "orig": ".", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 48, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 230.128, "r_y0": 460.165, "r_x1": 286.367, "r_y1": 460.165, "r_x2": 286.367, "r_y2": 451.613, "r_x3": 230.128, "r_y3": 451.613, "coord_origin": "TOPLEFT"}, "text": "This approach", "orig": "This approach", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 49, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 472.121, "r_x1": 128.179, "r_y1": 472.121, "r_x2": 128.179, "r_y2": 463.569, "r_x3": 50.112, "r_y3": 463.569, "coord_origin": "TOPLEFT"}, "text": "offers control over:", "orig": "offers control over:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 50, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 132.971, "r_y0": 472.121, "r_x1": 286.365, "r_y1": 472.121, "r_x2": 286.365, "r_y2": 463.569, "r_x3": 132.971, "r_y3": 463.569, "coord_origin": "TOPLEFT"}, "text": "1) the size of the dataset, 2) the table", "orig": "1) the size of the dataset, 2) the table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 51, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 484.076, "r_x1": 266.739, "r_y1": 484.076, "r_x2": 266.739, "r_y2": 475.524, "r_x3": 50.112, "r_y3": 475.524, "coord_origin": "TOPLEFT"}, "text": "structure, 3) the table style and 4) the type of content.", "orig": "structure, 3) the table style and 4) the type of content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 52, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 270.873, "r_y0": 484.076, "r_x1": 286.365, "r_y1": 484.076, "r_x2": 286.365, "r_y2": 475.524, "r_x3": 270.873, "r_y3": 475.524, "coord_origin": "TOPLEFT"}, "text": "The", "orig": "The", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 53, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 496.031, "r_x1": 286.365, "r_y1": 496.031, "r_x2": 286.365, "r_y2": 487.479, "r_x3": 50.112, "r_y3": 487.479, "coord_origin": "TOPLEFT"}, "text": "complexity of the table structure is described by the size of", "orig": "complexity of the table structure is described by the size of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 54, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 507.986, "r_x1": 286.365, "r_y1": 507.986, "r_x2": 286.365, "r_y2": 499.434, "r_x3": 50.112, "r_y3": 499.434, "coord_origin": "TOPLEFT"}, "text": "the table header and the table body, as well as the percentage", "orig": "the table header and the table body, as well as the percentage", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 55, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 519.941, "r_x1": 286.365, "r_y1": 519.941, "r_x2": 286.365, "r_y2": 511.389, "r_x3": 50.112, "r_y3": 511.389, "coord_origin": "TOPLEFT"}, "text": "of the table cells covered by row spans and column spans.", "orig": "of the table cells covered by row spans and column spans.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 56, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 531.8969999999999, "r_x1": 286.365, "r_y1": 531.8969999999999, "r_x2": 286.365, "r_y2": 523.345, "r_x3": 50.112, "r_y3": 523.345, "coord_origin": "TOPLEFT"}, "text": "A set of carefully designed styling templates provides the", "orig": "A set of carefully designed styling templates provides the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 57, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 543.852, "r_x1": 286.365, "r_y1": 543.852, "r_x2": 286.365, "r_y2": 535.3, "r_x3": 50.112, "r_y3": 535.3, "coord_origin": "TOPLEFT"}, "text": "basis to build a wide range of table appearances. Lastly, the", "orig": "basis to build a wide range of table appearances. Lastly, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 58, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 555.807, "r_x1": 286.365, "r_y1": 555.807, "r_x2": 286.365, "r_y2": 547.255, "r_x3": 50.112, "r_y3": 547.255, "coord_origin": "TOPLEFT"}, "text": "table content is generated out of a curated collection of text", "orig": "table content is generated out of a curated collection of text", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 59, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 567.762, "r_x1": 83.028, "r_y1": 567.762, "r_x2": 83.028, "r_y2": 559.21, "r_x3": 50.112, "r_y3": 559.21, "coord_origin": "TOPLEFT"}, "text": "corpora.", "orig": "corpora.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 60, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 87.153, "r_y0": 567.762, "r_x1": 286.365, "r_y1": 567.762, "r_x2": 286.365, "r_y2": 559.21, "r_x3": 87.153, "r_y3": 559.21, "coord_origin": "TOPLEFT"}, "text": "By controlling the size and scope of the synthetic", "orig": "By controlling the size and scope of the synthetic", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 61, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 579.717, "r_x1": 286.365, "r_y1": 579.717, "r_x2": 286.365, "r_y2": 571.165, "r_x3": 50.112, "r_y3": 571.165, "coord_origin": "TOPLEFT"}, "text": "datasets we are able to train and evaluate our models in a", "orig": "datasets we are able to train and evaluate our models in a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 62, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 591.672, "r_x1": 174.645, "r_y1": 591.672, "r_x2": 174.645, "r_y2": 583.12, "r_x3": 50.112, "r_y3": 583.12, "coord_origin": "TOPLEFT"}, "text": "variety of different conditions.", "orig": "variety of different conditions.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 63, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 181.021, "r_y0": 591.672, "r_x1": 286.365, "r_y1": 591.672, "r_x2": 286.365, "r_y2": 583.12, "r_x3": 181.021, "r_y3": 583.12, "coord_origin": "TOPLEFT"}, "text": "For example, we can first", "orig": "For example, we can first", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 64, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 603.6279999999999, "r_x1": 286.365, "r_y1": 603.6279999999999, "r_x2": 286.365, "r_y2": 595.076, "r_x3": 50.112, "r_y3": 595.076, "coord_origin": "TOPLEFT"}, "text": "generate a highly diverse dataset to train our models and", "orig": "generate a highly diverse dataset to train our models and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 65, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 615.583, "r_x1": 286.365, "r_y1": 615.583, "r_x2": 286.365, "r_y2": 607.031, "r_x3": 50.112, "r_y3": 607.031, "coord_origin": "TOPLEFT"}, "text": "then evaluate their performance on other synthetic datasets", "orig": "then evaluate their performance on other synthetic datasets", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 66, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 627.538, "r_x1": 209.753, "r_y1": 627.538, "r_x2": 209.753, "r_y2": 618.986, "r_x3": 50.112, "r_y3": 618.986, "coord_origin": "TOPLEFT"}, "text": "which are focused on a specific domain.", "orig": "which are focused on a specific domain.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Motivated by those observations we aimed at generating a synthetic table dataset named SynthTabNet . This approach offers control over: 1) the size of the dataset, 2) the table structure, 3) the table style and 4) the type of content. The complexity of the table structure is described by the size of the table header and the table body, as well as the percentage of the table cells covered by row spans and column spans. A set of carefully designed styling templates provides the basis to build a wide range of table appearances. Lastly, the table content is generated out of a curated collection of text corpora. By controlling the size and scope of the synthetic datasets we are able to train and evaluate our models in a variety of different conditions. For example, we can first generate a highly diverse dataset to train our models and then evaluate their performance on other synthetic datasets which are focused on a specific domain."}, {"label": "text", "id": 5, "page_no": 3, "cluster": {"id": 5, "label": "text", "bbox": {"l": 50.112, "t": 632.783, "r": 286.365, "b": 713.066, "coord_origin": "TOPLEFT"}, "confidence": 0.9871614575386047, "cells": [{"index": 67, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 641.335, "r_x1": 286.365, "r_y1": 641.335, "r_x2": 286.365, "r_y2": 632.783, "r_x3": 62.067, "r_y3": 632.783, "coord_origin": "TOPLEFT"}, "text": "In this regard, we have prepared four synthetic datasets,", "orig": "In this regard, we have prepared four synthetic datasets,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 68, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 653.29, "r_x1": 286.365, "r_y1": 653.29, "r_x2": 286.365, "r_y2": 644.738, "r_x3": 50.112, "r_y3": 644.738, "coord_origin": "TOPLEFT"}, "text": "each one containing 150k examples. The corpora to gener-", "orig": "each one containing 150k examples. The corpora to gener-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 69, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 665.246, "r_x1": 286.365, "r_y1": 665.246, "r_x2": 286.365, "r_y2": 656.694, "r_x3": 50.112, "r_y3": 656.694, "coord_origin": "TOPLEFT"}, "text": "ate the table text consists of the most frequent terms appear-", "orig": "ate the table text consists of the most frequent terms appear-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 70, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 677.201, "r_x1": 286.365, "r_y1": 677.201, "r_x2": 286.365, "r_y2": 668.649, "r_x3": 50.112, "r_y3": 668.649, "coord_origin": "TOPLEFT"}, "text": "ing in PubTabNet and FinTabNet together with randomly", "orig": "ing in PubTabNet and FinTabNet together with randomly", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 71, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 689.156, "r_x1": 109.519, "r_y1": 689.156, "r_x2": 109.519, "r_y2": 680.604, "r_x3": 50.112, "r_y3": 680.604, "coord_origin": "TOPLEFT"}, "text": "generated text.", "orig": "generated text.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 72, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 115.337, "r_y0": 689.156, "r_x1": 286.365, "r_y1": 689.156, "r_x2": 286.365, "r_y2": 680.604, "r_x3": 115.337, "r_y3": 680.604, "coord_origin": "TOPLEFT"}, "text": "The first two synthetic datasets have been", "orig": "The first two synthetic datasets have been", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 73, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 701.111, "r_x1": 286.365, "r_y1": 701.111, "r_x2": 286.365, "r_y2": 692.559, "r_x3": 50.112, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "fine-tuned to mimic the appearance of the original datasets", "orig": "fine-tuned to mimic the appearance of the original datasets", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 74, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 713.066, "r_x1": 286.365, "r_y1": 713.066, "r_x2": 286.365, "r_y2": 704.514, "r_x3": 50.112, "r_y3": 704.514, "coord_origin": "TOPLEFT"}, "text": "but encompass more complicated table structures. The third", "orig": "but encompass more complicated table structures. The third", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "In this regard, we have prepared four synthetic datasets, each one containing 150k examples. The corpora to generate the table text consists of the most frequent terms appearing in PubTabNet and FinTabNet together with randomly generated text. The first two synthetic datasets have been fine-tuned to mimic the appearance of the original datasets but encompass more complicated table structures. The third"}, {"label": "table", "id": 8, "page_no": 3, "cluster": {"id": 8, "label": "table", "bbox": {"l": 310.67584228515625, "t": 73.19388580322266, "r": 542.9547119140625, "b": 155.22052001953125, "coord_origin": "TOPLEFT"}, "confidence": 0.9777463674545288, "cells": [{"index": 75, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 412.332, "r_y0": 82.43499999999995, "r_x1": 430.902, "r_y1": 82.43499999999995, "r_x2": 430.902, "r_y2": 73.88300000000004, "r_x3": 412.332, "r_y3": 73.88300000000004, "coord_origin": "TOPLEFT"}, "text": "Tags", "orig": "Tags", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 76, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 442.857, "r_y0": 82.43499999999995, "r_x1": 464.446, "r_y1": 82.43499999999995, "r_x2": 464.446, "r_y2": 73.88300000000004, "r_x3": 442.857, "r_y3": 73.88300000000004, "coord_origin": "TOPLEFT"}, "text": "Bbox", "orig": "Bbox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 77, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 477.786, "r_y0": 82.43499999999995, "r_x1": 494.942, "r_y1": 82.43499999999995, "r_x2": 494.942, "r_y2": 73.88300000000004, "r_x3": 477.786, "r_y3": 73.88300000000004, "coord_origin": "TOPLEFT"}, "text": "Size", "orig": "Size", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 78, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 508.282, "r_y0": 82.43499999999995, "r_x1": 536.914, "r_y1": 82.43499999999995, "r_x2": 536.914, "r_y2": 73.88300000000004, "r_x3": 508.282, "r_y3": 73.88300000000004, "coord_origin": "TOPLEFT"}, "text": "Format", "orig": "Format", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 79, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 317.06, "r_y0": 94.78800000000001, "r_x1": 361.643, "r_y1": 94.78800000000001, "r_x2": 361.643, "r_y2": 86.23599999999999, "r_x3": 317.06, "r_y3": 86.23599999999999, "coord_origin": "TOPLEFT"}, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 80, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 417.856, "r_y0": 92.72199999999998, "r_x1": 425.378, "r_y1": 92.72199999999998, "r_x2": 425.378, "r_y2": 85.668, "r_x3": 417.856, "r_y3": 85.668, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 81, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 449.896, "r_y0": 92.72199999999998, "r_x1": 457.417, "r_y1": 92.72199999999998, "r_x2": 457.417, "r_y2": 85.668, "r_x3": 449.896, "r_y3": 85.668, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 82, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 476.401, "r_y0": 94.78800000000001, "r_x1": 496.326, "r_y1": 94.78800000000001, "r_x2": 496.326, "r_y2": 86.23599999999999, "r_x3": 476.401, "r_y3": 86.23599999999999, "coord_origin": "TOPLEFT"}, "text": "509k", "orig": "509k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 83, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 512.635, "r_y0": 94.78800000000001, "r_x1": 532.56, "r_y1": 94.78800000000001, "r_x2": 532.56, "r_y2": 86.23599999999999, "r_x3": 512.635, "r_y3": 86.23599999999999, "coord_origin": "TOPLEFT"}, "text": "PNG", "orig": "PNG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 84, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 317.06, "r_y0": 106.74300000000005, "r_x1": 359.431, "r_y1": 106.74300000000005, "r_x2": 359.431, "r_y2": 98.19100000000003, "r_x3": 317.06, "r_y3": 98.19100000000003, "coord_origin": "TOPLEFT"}, "text": "FinTabNet", "orig": "FinTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 85, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 417.856, "r_y0": 104.67700000000002, "r_x1": 425.378, "r_y1": 104.67700000000002, "r_x2": 425.378, "r_y2": 97.62300000000005, "r_x3": 417.856, "r_y3": 97.62300000000005, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 86, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 449.896, "r_y0": 104.67700000000002, "r_x1": 457.417, "r_y1": 104.67700000000002, "r_x2": 457.417, "r_y2": 97.62300000000005, "r_x3": 449.896, "r_y3": 97.62300000000005, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 87, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 476.401, "r_y0": 106.74300000000005, "r_x1": 496.326, "r_y1": 106.74300000000005, "r_x2": 496.326, "r_y2": 98.19100000000003, "r_x3": 476.401, "r_y3": 98.19100000000003, "coord_origin": "TOPLEFT"}, "text": "112k", "orig": "112k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 88, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 513.462, "r_y0": 106.74300000000005, "r_x1": 531.733, "r_y1": 106.74300000000005, "r_x2": 531.733, "r_y2": 98.19100000000003, "r_x3": 513.462, "r_y3": 98.19100000000003, "coord_origin": "TOPLEFT"}, "text": "PDF", "orig": "PDF", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 89, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 317.06, "r_y0": 118.69899999999996, "r_x1": 359.979, "r_y1": 118.69899999999996, "r_x2": 359.979, "r_y2": 110.14700000000005, "r_x3": 317.06, "r_y3": 110.14700000000005, "coord_origin": "TOPLEFT"}, "text": "TableBank", "orig": "TableBank", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 90, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 417.856, "r_y0": 116.63300000000004, "r_x1": 425.378, "r_y1": 116.63300000000004, "r_x2": 425.378, "r_y2": 109.57899999999995, "r_x3": 417.856, "r_y3": 109.57899999999995, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 91, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 450.812, "r_y0": 116.63300000000004, "r_x1": 456.501, "r_y1": 116.63300000000004, "r_x2": 456.501, "r_y2": 109.57899999999995, "r_x3": 450.812, "r_y3": 109.57899999999995, "coord_origin": "TOPLEFT"}, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 92, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 476.401, "r_y0": 118.69899999999996, "r_x1": 496.326, "r_y1": 118.69899999999996, "r_x2": 496.326, "r_y2": 110.14700000000005, "r_x3": 476.401, "r_y3": 110.14700000000005, "coord_origin": "TOPLEFT"}, "text": "145k", "orig": "145k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 93, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 511.25, "r_y0": 118.69899999999996, "r_x1": 533.945, "r_y1": 118.69899999999996, "r_x2": 533.945, "r_y2": 110.14700000000005, "r_x3": 511.25, "r_y3": 110.14700000000005, "coord_origin": "TOPLEFT"}, "text": "JPEG", "orig": "JPEG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 94, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 317.06, "r_y0": 130.654, "r_x1": 400.377, "r_y1": 130.654, "r_x2": 400.377, "r_y2": 122.10199999999998, "r_x3": 317.06, "r_y3": 122.10199999999998, "coord_origin": "TOPLEFT"}, "text": "Combined-Tabnet(*)", "orig": "Combined-Tabnet(*)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 95, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 417.856, "r_y0": 128.58799999999997, "r_x1": 425.378, "r_y1": 128.58799999999997, "r_x2": 425.378, "r_y2": 121.53399999999999, "r_x3": 417.856, "r_y3": 121.53399999999999, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 96, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 449.896, "r_y0": 128.58799999999997, "r_x1": 457.417, "r_y1": 128.58799999999997, "r_x2": 457.417, "r_y2": 121.53399999999999, "r_x3": 449.896, "r_y3": 121.53399999999999, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 97, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 476.401, "r_y0": 130.654, "r_x1": 496.326, "r_y1": 130.654, "r_x2": 496.326, "r_y2": 122.10199999999998, "r_x3": 476.401, "r_y3": 122.10199999999998, "coord_origin": "TOPLEFT"}, "text": "400k", "orig": "400k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 98, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 512.635, "r_y0": 130.654, "r_x1": 532.56, "r_y1": 130.654, "r_x2": 532.56, "r_y2": 122.10199999999998, "r_x3": 512.635, "r_y3": 122.10199999999998, "coord_origin": "TOPLEFT"}, "text": "PNG", "orig": "PNG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 99, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 317.06, "r_y0": 142.60900000000004, "r_x1": 375.172, "r_y1": 142.60900000000004, "r_x2": 375.172, "r_y2": 134.05700000000002, "r_x3": 317.06, "r_y3": 134.05700000000002, "coord_origin": "TOPLEFT"}, "text": "Combined(**)", "orig": "Combined(**)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 100, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 417.856, "r_y0": 140.543, "r_x1": 425.378, "r_y1": 140.543, "r_x2": 425.378, "r_y2": 133.48900000000003, "r_x3": 417.856, "r_y3": 133.48900000000003, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 101, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 449.896, "r_y0": 140.543, "r_x1": 457.417, "r_y1": 140.543, "r_x2": 457.417, "r_y2": 133.48900000000003, "r_x3": 449.896, "r_y3": 133.48900000000003, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 102, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 476.401, "r_y0": 142.60900000000004, "r_x1": 496.326, "r_y1": 142.60900000000004, "r_x2": 496.326, "r_y2": 134.05700000000002, "r_x3": 476.401, "r_y3": 134.05700000000002, "coord_origin": "TOPLEFT"}, "text": "500k", "orig": "500k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 103, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 512.635, "r_y0": 142.60900000000004, "r_x1": 532.56, "r_y1": 142.60900000000004, "r_x2": 532.56, "r_y2": 134.05700000000002, "r_x3": 512.635, "r_y3": 134.05700000000002, "coord_origin": "TOPLEFT"}, "text": "PNG", "orig": "PNG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 104, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 317.06, "r_y0": 154.56399999999996, "r_x1": 369.394, "r_y1": 154.56399999999996, "r_x2": 369.394, "r_y2": 146.01199999999994, "r_x3": 317.06, "r_y3": 146.01199999999994, "coord_origin": "TOPLEFT"}, "text": "SynthTabNet", "orig": "SynthTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 105, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 417.856, "r_y0": 152.49800000000005, "r_x1": 425.378, "r_y1": 152.49800000000005, "r_x2": 425.378, "r_y2": 145.44399999999996, "r_x3": 417.856, "r_y3": 145.44399999999996, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 106, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 449.896, "r_y0": 152.49800000000005, "r_x1": 457.417, "r_y1": 152.49800000000005, "r_x2": 457.417, "r_y2": 145.44399999999996, "r_x3": 449.896, "r_y3": 145.44399999999996, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 107, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 476.401, "r_y0": 154.56399999999996, "r_x1": 496.326, "r_y1": 154.56399999999996, "r_x2": 496.326, "r_y2": 146.01199999999994, "r_x3": 476.401, "r_y3": 146.01199999999994, "coord_origin": "TOPLEFT"}, "text": "600k", "orig": "600k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 108, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 512.635, "r_y0": 154.56399999999996, "r_x1": 532.56, "r_y1": 154.56399999999996, "r_x2": 532.56, "r_y2": 146.01199999999994, "r_x3": 512.635, "r_y3": 146.01199999999994, "coord_origin": "TOPLEFT"}, "text": "PNG", "orig": "PNG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": [{"id": 17, "label": "text", "bbox": {"l": 412.332, "t": 73.88300000000004, "r": 430.902, "b": 82.43499999999995, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 75, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 412.332, "r_y0": 82.43499999999995, "r_x1": 430.902, "r_y1": 82.43499999999995, "r_x2": 430.902, "r_y2": 73.88300000000004, "r_x3": 412.332, "r_y3": 73.88300000000004, "coord_origin": "TOPLEFT"}, "text": "Tags", "orig": "Tags", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 18, "label": "text", "bbox": {"l": 442.857, "t": 73.88300000000004, "r": 464.446, "b": 82.43499999999995, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 76, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 442.857, "r_y0": 82.43499999999995, "r_x1": 464.446, "r_y1": 82.43499999999995, "r_x2": 464.446, "r_y2": 73.88300000000004, "r_x3": 442.857, "r_y3": 73.88300000000004, "coord_origin": "TOPLEFT"}, "text": "Bbox", "orig": "Bbox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 19, "label": "text", "bbox": {"l": 477.786, "t": 73.88300000000004, "r": 494.942, "b": 82.43499999999995, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 77, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 477.786, "r_y0": 82.43499999999995, "r_x1": 494.942, "r_y1": 82.43499999999995, "r_x2": 494.942, "r_y2": 73.88300000000004, "r_x3": 477.786, "r_y3": 73.88300000000004, "coord_origin": "TOPLEFT"}, "text": "Size", "orig": "Size", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 20, "label": "text", "bbox": {"l": 508.282, "t": 73.88300000000004, "r": 536.914, "b": 82.43499999999995, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 78, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 508.282, "r_y0": 82.43499999999995, "r_x1": 536.914, "r_y1": 82.43499999999995, "r_x2": 536.914, "r_y2": 73.88300000000004, "r_x3": 508.282, "r_y3": 73.88300000000004, "coord_origin": "TOPLEFT"}, "text": "Format", "orig": "Format", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 21, "label": "text", "bbox": {"l": 317.06, "t": 86.23599999999999, "r": 361.643, "b": 94.78800000000001, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 79, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 317.06, "r_y0": 94.78800000000001, "r_x1": 361.643, "r_y1": 94.78800000000001, "r_x2": 361.643, "r_y2": 86.23599999999999, "r_x3": 317.06, "r_y3": 86.23599999999999, "coord_origin": "TOPLEFT"}, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 22, "label": "text", "bbox": {"l": 417.856, "t": 85.668, "r": 425.378, "b": 92.72199999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 80, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 417.856, "r_y0": 92.72199999999998, "r_x1": 425.378, "r_y1": 92.72199999999998, "r_x2": 425.378, "r_y2": 85.668, "r_x3": 417.856, "r_y3": 85.668, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 23, "label": "text", "bbox": {"l": 449.896, "t": 85.668, "r": 457.417, "b": 92.72199999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 81, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 449.896, "r_y0": 92.72199999999998, "r_x1": 457.417, "r_y1": 92.72199999999998, "r_x2": 457.417, "r_y2": 85.668, "r_x3": 449.896, "r_y3": 85.668, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 24, "label": "text", "bbox": {"l": 476.401, "t": 86.23599999999999, "r": 496.326, "b": 94.78800000000001, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 82, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 476.401, "r_y0": 94.78800000000001, "r_x1": 496.326, "r_y1": 94.78800000000001, "r_x2": 496.326, "r_y2": 86.23599999999999, "r_x3": 476.401, "r_y3": 86.23599999999999, "coord_origin": "TOPLEFT"}, "text": "509k", "orig": "509k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 25, "label": "text", "bbox": {"l": 512.635, "t": 86.23599999999999, "r": 532.56, "b": 94.78800000000001, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 83, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 512.635, "r_y0": 94.78800000000001, "r_x1": 532.56, "r_y1": 94.78800000000001, "r_x2": 532.56, "r_y2": 86.23599999999999, "r_x3": 512.635, "r_y3": 86.23599999999999, "coord_origin": "TOPLEFT"}, "text": "PNG", "orig": "PNG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 26, "label": "text", "bbox": {"l": 317.06, "t": 98.19100000000003, "r": 359.431, "b": 106.74300000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 84, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 317.06, "r_y0": 106.74300000000005, "r_x1": 359.431, "r_y1": 106.74300000000005, "r_x2": 359.431, "r_y2": 98.19100000000003, "r_x3": 317.06, "r_y3": 98.19100000000003, "coord_origin": "TOPLEFT"}, "text": "FinTabNet", "orig": "FinTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 27, "label": "text", "bbox": {"l": 417.856, "t": 97.62300000000005, "r": 425.378, "b": 104.67700000000002, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 85, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 417.856, "r_y0": 104.67700000000002, "r_x1": 425.378, "r_y1": 104.67700000000002, "r_x2": 425.378, "r_y2": 97.62300000000005, "r_x3": 417.856, "r_y3": 97.62300000000005, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 28, "label": "text", "bbox": {"l": 449.896, "t": 97.62300000000005, "r": 457.417, "b": 104.67700000000002, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 86, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 449.896, "r_y0": 104.67700000000002, "r_x1": 457.417, "r_y1": 104.67700000000002, "r_x2": 457.417, "r_y2": 97.62300000000005, "r_x3": 449.896, "r_y3": 97.62300000000005, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 29, "label": "text", "bbox": {"l": 476.401, "t": 98.19100000000003, "r": 496.326, "b": 106.74300000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 87, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 476.401, "r_y0": 106.74300000000005, "r_x1": 496.326, "r_y1": 106.74300000000005, "r_x2": 496.326, "r_y2": 98.19100000000003, "r_x3": 476.401, "r_y3": 98.19100000000003, "coord_origin": "TOPLEFT"}, "text": "112k", "orig": "112k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 30, "label": "text", "bbox": {"l": 513.462, "t": 98.19100000000003, "r": 531.733, "b": 106.74300000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 88, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 513.462, "r_y0": 106.74300000000005, "r_x1": 531.733, "r_y1": 106.74300000000005, "r_x2": 531.733, "r_y2": 98.19100000000003, "r_x3": 513.462, "r_y3": 98.19100000000003, "coord_origin": "TOPLEFT"}, "text": "PDF", "orig": "PDF", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 31, "label": "text", "bbox": {"l": 317.06, "t": 110.14700000000005, "r": 359.979, "b": 118.69899999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 89, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 317.06, "r_y0": 118.69899999999996, "r_x1": 359.979, "r_y1": 118.69899999999996, "r_x2": 359.979, "r_y2": 110.14700000000005, "r_x3": 317.06, "r_y3": 110.14700000000005, "coord_origin": "TOPLEFT"}, "text": "TableBank", "orig": "TableBank", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 32, "label": "text", "bbox": {"l": 417.856, "t": 109.57899999999995, "r": 425.378, "b": 116.63300000000004, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 90, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 417.856, "r_y0": 116.63300000000004, "r_x1": 425.378, "r_y1": 116.63300000000004, "r_x2": 425.378, "r_y2": 109.57899999999995, "r_x3": 417.856, "r_y3": 109.57899999999995, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 33, "label": "text", "bbox": {"l": 450.812, "t": 109.57899999999995, "r": 456.501, "b": 116.63300000000004, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 91, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 450.812, "r_y0": 116.63300000000004, "r_x1": 456.501, "r_y1": 116.63300000000004, "r_x2": 456.501, "r_y2": 109.57899999999995, "r_x3": 450.812, "r_y3": 109.57899999999995, "coord_origin": "TOPLEFT"}, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 34, "label": "text", "bbox": {"l": 476.401, "t": 110.14700000000005, "r": 496.326, "b": 118.69899999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 92, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 476.401, "r_y0": 118.69899999999996, "r_x1": 496.326, "r_y1": 118.69899999999996, "r_x2": 496.326, "r_y2": 110.14700000000005, "r_x3": 476.401, "r_y3": 110.14700000000005, "coord_origin": "TOPLEFT"}, "text": "145k", "orig": "145k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 35, "label": "text", "bbox": {"l": 511.25, "t": 110.14700000000005, "r": 533.945, "b": 118.69899999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 93, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 511.25, "r_y0": 118.69899999999996, "r_x1": 533.945, "r_y1": 118.69899999999996, "r_x2": 533.945, "r_y2": 110.14700000000005, "r_x3": 511.25, "r_y3": 110.14700000000005, "coord_origin": "TOPLEFT"}, "text": "JPEG", "orig": "JPEG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 36, "label": "text", "bbox": {"l": 317.06, "t": 122.10199999999998, "r": 400.377, "b": 130.654, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 94, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 317.06, "r_y0": 130.654, "r_x1": 400.377, "r_y1": 130.654, "r_x2": 400.377, "r_y2": 122.10199999999998, "r_x3": 317.06, "r_y3": 122.10199999999998, "coord_origin": "TOPLEFT"}, "text": "Combined-Tabnet(*)", "orig": "Combined-Tabnet(*)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 37, "label": "text", "bbox": {"l": 417.856, "t": 121.53399999999999, "r": 425.378, "b": 128.58799999999997, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 95, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 417.856, "r_y0": 128.58799999999997, "r_x1": 425.378, "r_y1": 128.58799999999997, "r_x2": 425.378, "r_y2": 121.53399999999999, "r_x3": 417.856, "r_y3": 121.53399999999999, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 38, "label": "text", "bbox": {"l": 449.896, "t": 121.53399999999999, "r": 457.417, "b": 128.58799999999997, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 96, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 449.896, "r_y0": 128.58799999999997, "r_x1": 457.417, "r_y1": 128.58799999999997, "r_x2": 457.417, "r_y2": 121.53399999999999, "r_x3": 449.896, "r_y3": 121.53399999999999, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 39, "label": "text", "bbox": {"l": 476.401, "t": 122.10199999999998, "r": 496.326, "b": 130.654, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 97, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 476.401, "r_y0": 130.654, "r_x1": 496.326, "r_y1": 130.654, "r_x2": 496.326, "r_y2": 122.10199999999998, "r_x3": 476.401, "r_y3": 122.10199999999998, "coord_origin": "TOPLEFT"}, "text": "400k", "orig": "400k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 40, "label": "text", "bbox": {"l": 512.635, "t": 122.10199999999998, "r": 532.56, "b": 130.654, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 98, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 512.635, "r_y0": 130.654, "r_x1": 532.56, "r_y1": 130.654, "r_x2": 532.56, "r_y2": 122.10199999999998, "r_x3": 512.635, "r_y3": 122.10199999999998, "coord_origin": "TOPLEFT"}, "text": "PNG", "orig": "PNG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 41, "label": "text", "bbox": {"l": 317.06, "t": 134.05700000000002, "r": 375.172, "b": 142.60900000000004, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 99, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 317.06, "r_y0": 142.60900000000004, "r_x1": 375.172, "r_y1": 142.60900000000004, "r_x2": 375.172, "r_y2": 134.05700000000002, "r_x3": 317.06, "r_y3": 134.05700000000002, "coord_origin": "TOPLEFT"}, "text": "Combined(**)", "orig": "Combined(**)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 42, "label": "text", "bbox": {"l": 417.856, "t": 133.48900000000003, "r": 425.378, "b": 140.543, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 100, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 417.856, "r_y0": 140.543, "r_x1": 425.378, "r_y1": 140.543, "r_x2": 425.378, "r_y2": 133.48900000000003, "r_x3": 417.856, "r_y3": 133.48900000000003, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 43, "label": "text", "bbox": {"l": 449.896, "t": 133.48900000000003, "r": 457.417, "b": 140.543, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 101, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 449.896, "r_y0": 140.543, "r_x1": 457.417, "r_y1": 140.543, "r_x2": 457.417, "r_y2": 133.48900000000003, "r_x3": 449.896, "r_y3": 133.48900000000003, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 44, "label": "text", "bbox": {"l": 476.401, "t": 134.05700000000002, "r": 496.326, "b": 142.60900000000004, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 102, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 476.401, "r_y0": 142.60900000000004, "r_x1": 496.326, "r_y1": 142.60900000000004, "r_x2": 496.326, "r_y2": 134.05700000000002, "r_x3": 476.401, "r_y3": 134.05700000000002, "coord_origin": "TOPLEFT"}, "text": "500k", "orig": "500k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 45, "label": "text", "bbox": {"l": 512.635, "t": 134.05700000000002, "r": 532.56, "b": 142.60900000000004, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 103, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 512.635, "r_y0": 142.60900000000004, "r_x1": 532.56, "r_y1": 142.60900000000004, "r_x2": 532.56, "r_y2": 134.05700000000002, "r_x3": 512.635, "r_y3": 134.05700000000002, "coord_origin": "TOPLEFT"}, "text": "PNG", "orig": "PNG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 46, "label": "text", "bbox": {"l": 317.06, "t": 146.01199999999994, "r": 369.394, "b": 154.56399999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 104, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 317.06, "r_y0": 154.56399999999996, "r_x1": 369.394, "r_y1": 154.56399999999996, "r_x2": 369.394, "r_y2": 146.01199999999994, "r_x3": 317.06, "r_y3": 146.01199999999994, "coord_origin": "TOPLEFT"}, "text": "SynthTabNet", "orig": "SynthTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 47, "label": "text", "bbox": {"l": 417.856, "t": 145.44399999999996, "r": 425.378, "b": 152.49800000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 105, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 417.856, "r_y0": 152.49800000000005, "r_x1": 425.378, "r_y1": 152.49800000000005, "r_x2": 425.378, "r_y2": 145.44399999999996, "r_x3": 417.856, "r_y3": 145.44399999999996, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 48, "label": "text", "bbox": {"l": 449.896, "t": 145.44399999999996, "r": 457.417, "b": 152.49800000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 106, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 449.896, "r_y0": 152.49800000000005, "r_x1": 457.417, "r_y1": 152.49800000000005, "r_x2": 457.417, "r_y2": 145.44399999999996, "r_x3": 449.896, "r_y3": 145.44399999999996, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 49, "label": "text", "bbox": {"l": 476.401, "t": 146.01199999999994, "r": 496.326, "b": 154.56399999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 107, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 476.401, "r_y0": 154.56399999999996, "r_x1": 496.326, "r_y1": 154.56399999999996, "r_x2": 496.326, "r_y2": 146.01199999999994, "r_x3": 476.401, "r_y3": 146.01199999999994, "coord_origin": "TOPLEFT"}, "text": "600k", "orig": "600k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 50, "label": "text", "bbox": {"l": 512.635, "t": 146.01199999999994, "r": 532.56, "b": 154.56399999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 108, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 512.635, "r_y0": 154.56399999999996, "r_x1": 532.56, "r_y1": 154.56399999999996, "r_x2": 532.56, "r_y2": 146.01199999999994, "r_x3": 512.635, "r_y3": 146.01199999999994, "coord_origin": "TOPLEFT"}, "text": "PNG", "orig": "PNG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}]}, "text": null, "otsl_seq": ["ecel", "ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 7, "num_cols": 5, "table_cells": [{"bbox": {"l": 412.332, "t": 73.88300000000004, "r": 430.902, "b": 82.43499999999995, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "Tags", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 442.857, "t": 73.88300000000004, "r": 464.446, "b": 82.43499999999995, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "Bbox", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 477.786, "t": 73.88300000000004, "r": 494.942, "b": 82.43499999999995, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "Size", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 508.282, "t": 73.88300000000004, "r": 536.914, "b": 82.43499999999995, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "Format", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 317.06, "t": 86.23599999999999, "r": 361.643, "b": 94.78800000000001, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "PubTabNet", "column_header": false, "row_header": true, "row_section": false}, {"bbox": {"l": 417.856, "t": 85.668, "r": 425.378, "b": 92.72199999999998, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "3", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 449.896, "t": 85.668, "r": 457.417, "b": 92.72199999999998, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "3", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 476.401, "t": 86.23599999999999, "r": 496.326, "b": 94.78800000000001, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "509k", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 512.635, "t": 86.23599999999999, "r": 532.56, "b": 94.78800000000001, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "PNG", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 317.06, "t": 98.19100000000003, "r": 359.431, "b": 106.74300000000005, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "FinTabNet", "column_header": false, "row_header": true, "row_section": false}, {"bbox": {"l": 417.856, "t": 97.62300000000005, "r": 425.378, "b": 104.67700000000002, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "3", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 449.896, "t": 97.62300000000005, "r": 457.417, "b": 104.67700000000002, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "3", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 476.401, "t": 98.19100000000003, "r": 496.326, "b": 106.74300000000005, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "112k", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 513.462, "t": 98.19100000000003, "r": 531.733, "b": 106.74300000000005, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "PDF", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 317.06, "t": 110.14700000000005, "r": 359.979, "b": 118.69899999999996, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "TableBank", "column_header": false, "row_header": true, "row_section": false}, {"bbox": {"l": 417.856, "t": 109.57899999999995, "r": 425.378, "b": 116.63300000000004, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "3", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 450.812, "t": 109.57899999999995, "r": 456.501, "b": 116.63300000000004, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "7", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 476.401, "t": 110.14700000000005, "r": 496.326, "b": 118.69899999999996, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "145k", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 511.25, "t": 110.14700000000005, "r": 533.945, "b": 118.69899999999996, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "JPEG", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 317.06, "t": 122.10199999999998, "r": 400.377, "b": 130.654, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Combined-Tabnet(*)", "column_header": false, "row_header": true, "row_section": false}, {"bbox": {"l": 417.856, "t": 121.53399999999999, "r": 425.378, "b": 128.58799999999997, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "3", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 449.896, "t": 121.53399999999999, "r": 457.417, "b": 128.58799999999997, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "3", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 476.401, "t": 122.10199999999998, "r": 496.326, "b": 130.654, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "400k", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 512.635, "t": 122.10199999999998, "r": 532.56, "b": 130.654, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "PNG", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 317.06, "t": 134.05700000000002, "r": 375.172, "b": 142.60900000000004, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Combined(**)", "column_header": false, "row_header": true, "row_section": false}, {"bbox": {"l": 417.856, "t": 133.48900000000003, "r": 425.378, "b": 140.543, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "3", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 449.896, "t": 133.48900000000003, "r": 457.417, "b": 140.543, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "3", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 476.401, "t": 134.05700000000002, "r": 496.326, "b": 142.60900000000004, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "500k", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 512.635, "t": 134.05700000000002, "r": 532.56, "b": 142.60900000000004, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "PNG", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 317.06, "t": 146.01199999999994, "r": 369.394, "b": 154.56399999999996, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "SynthTabNet", "column_header": false, "row_header": true, "row_section": false}, {"bbox": {"l": 417.856, "t": 145.44399999999996, "r": 425.378, "b": 152.49800000000005, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "3", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 449.896, "t": 145.44399999999996, "r": 457.417, "b": 152.49800000000005, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "3", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 476.401, "t": 146.01199999999994, "r": 496.326, "b": 154.56399999999996, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "600k", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 512.635, "t": 146.01199999999994, "r": 532.56, "b": 154.56399999999996, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "PNG", "column_header": false, "row_header": false, "row_section": false}]}, {"label": "caption", "id": 9, "page_no": 3, "cluster": {"id": 9, "label": "caption", "bbox": {"l": 308.862, "t": 167.75099999999998, "r": 545.115, "b": 224.303, "coord_origin": "TOPLEFT"}, "confidence": 0.9667726755142212, "cells": [{"index": 109, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 176.48199999999997, "r_x1": 330.75, "r_y1": 176.48199999999997, "r_x2": 330.75, "r_y2": 167.92999999999995, "r_x3": 308.862, "r_y3": 167.92999999999995, "coord_origin": "TOPLEFT"}, "text": "Table", "orig": "Table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 110, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 336.867, "r_y0": 176.48199999999997, "r_x1": 344.618, "r_y1": 176.48199999999997, "r_x2": 344.618, "r_y2": 167.92999999999995, "r_x3": 336.867, "r_y3": 167.92999999999995, "coord_origin": "TOPLEFT"}, "text": "1:", "orig": "1:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 111, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 361.076, "r_y0": 176.48199999999997, "r_x1": 380.453, "r_y1": 176.48199999999997, "r_x2": 380.453, "r_y2": 167.92999999999995, "r_x3": 361.076, "r_y3": 167.92999999999995, "coord_origin": "TOPLEFT"}, "text": "Both", "orig": "Both", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 112, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 386.568, "r_y0": 176.33900000000006, "r_x1": 468.68, "r_y1": 176.33900000000006, "r_x2": 468.68, "r_y2": 167.75099999999998, "r_x3": 386.568, "r_y3": 167.75099999999998, "coord_origin": "TOPLEFT"}, "text": "'Combined-Tabnet'", "orig": "'Combined-Tabnet'", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 113, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 474.796, "r_y0": 176.48199999999997, "r_x1": 489.182, "r_y1": 176.48199999999997, "r_x2": 489.182, "r_y2": 167.92999999999995, "r_x3": 474.796, "r_y3": 167.92999999999995, "coord_origin": "TOPLEFT"}, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 114, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 495.299, "r_y0": 176.33900000000006, "r_x1": 545.112, "r_y1": 176.33900000000006, "r_x2": 545.112, "r_y2": 167.75099999999998, "r_x3": 495.299, "r_y3": 167.75099999999998, "coord_origin": "TOPLEFT"}, "text": "'Combined-", "orig": "'Combined-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 115, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 188.29399999999998, "r_x1": 341.161, "r_y1": 188.29399999999998, "r_x2": 341.161, "r_y2": 179.70600000000002, "r_x3": 308.862, "r_y3": 179.70600000000002, "coord_origin": "TOPLEFT"}, "text": "Tabnet'", "orig": "Tabnet'", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 116, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 343.457, "r_y0": 188.437, "r_x1": 545.11, "r_y1": 188.437, "r_x2": 545.11, "r_y2": 179.885, "r_x3": 343.457, "r_y3": 179.885, "coord_origin": "TOPLEFT"}, "text": "are variations of the following: (*) The Combined-", "orig": "are variations of the following: (*) The Combined-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 117, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 200.39200000000005, "r_x1": 545.115, "r_y1": 200.39200000000005, "r_x2": 545.115, "r_y2": 191.84000000000003, "r_x3": 308.862, "r_y3": 191.84000000000003, "coord_origin": "TOPLEFT"}, "text": "Tabnet dataset is the processed combination of PubTabNet", "orig": "Tabnet dataset is the processed combination of PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 118, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 212.34699999999998, "r_x1": 366.276, "r_y1": 212.34699999999998, "r_x2": 366.276, "r_y2": 203.79499999999996, "r_x3": 308.862, "r_y3": 203.79499999999996, "coord_origin": "TOPLEFT"}, "text": "and Fintabnet.", "orig": "and Fintabnet.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 119, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 370.58, "r_y0": 212.34699999999998, "r_x1": 545.115, "r_y1": 212.34699999999998, "r_x2": 545.115, "r_y2": 203.79499999999996, "r_x3": 370.58, "r_y3": 203.79499999999996, "coord_origin": "TOPLEFT"}, "text": "(**) The combined dataset is the processed", "orig": "(**) The combined dataset is the processed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 120, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 224.303, "r_x1": 523.935, "r_y1": 224.303, "r_x2": 523.935, "r_y2": 215.75099999999998, "r_x3": 308.862, "r_y3": 215.75099999999998, "coord_origin": "TOPLEFT"}, "text": "combination of PubTabNet, Fintabnet and TableBank.", "orig": "combination of PubTabNet, Fintabnet and TableBank.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Table 1: Both 'Combined-Tabnet' and 'CombinedTabnet' are variations of the following: (*) The CombinedTabnet dataset is the processed combination of PubTabNet and Fintabnet. (**) The combined dataset is the processed combination of PubTabNet, Fintabnet and TableBank."}, {"label": "text", "id": 6, "page_no": 3, "cluster": {"id": 6, "label": "text", "bbox": {"l": 308.862, "t": 249.889, "r": 545.115, "b": 294.306, "coord_origin": "TOPLEFT"}, "confidence": 0.978954017162323, "cells": [{"index": 121, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 258.44100000000003, "r_x1": 545.115, "r_y1": 258.44100000000003, "r_x2": 545.115, "r_y2": 249.889, "r_x3": 308.862, "r_y3": 249.889, "coord_origin": "TOPLEFT"}, "text": "one adopts a colorful appearance with high contrast and the", "orig": "one adopts a colorful appearance with high contrast and the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 122, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 270.39599999999996, "r_x1": 545.115, "r_y1": 270.39599999999996, "r_x2": 545.115, "r_y2": 261.84400000000005, "r_x3": 308.862, "r_y3": 261.84400000000005, "coord_origin": "TOPLEFT"}, "text": "last one contains tables with sparse content. Lastly, we have", "orig": "last one contains tables with sparse content. Lastly, we have", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 123, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 282.351, "r_x1": 545.115, "r_y1": 282.351, "r_x2": 545.115, "r_y2": 273.799, "r_x3": 308.862, "r_y3": 273.799, "coord_origin": "TOPLEFT"}, "text": "combined all synthetic datasets into one big unified syn-", "orig": "combined all synthetic datasets into one big unified syn-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 124, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 294.306, "r_x1": 436.822, "r_y1": 294.306, "r_x2": 436.822, "r_y2": 285.754, "r_x3": 308.862, "r_y3": 285.754, "coord_origin": "TOPLEFT"}, "text": "thetic dataset of 600k examples.", "orig": "thetic dataset of 600k examples.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "one adopts a colorful appearance with high contrast and the last one contains tables with sparse content. Lastly, we have combined all synthetic datasets into one big unified synthetic dataset of 600k examples."}, {"label": "text", "id": 13, "page_no": 3, "cluster": {"id": 13, "label": "text", "bbox": {"l": 320.817, "t": 298.041, "r": 542.744, "b": 306.593, "coord_origin": "TOPLEFT"}, "confidence": 0.9043695330619812, "cells": [{"index": 125, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 306.593, "r_x1": 542.744, "r_y1": 306.593, "r_x2": 542.744, "r_y2": 298.041, "r_x3": 320.817, "r_y3": 298.041, "coord_origin": "TOPLEFT"}, "text": "Tab. 1 summarizes the various attributes of the datasets.", "orig": "Tab. 1 summarizes the various attributes of the datasets.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Tab. 1 summarizes the various attributes of the datasets."}, {"label": "section_header", "id": 11, "page_no": 3, "cluster": {"id": 11, "label": "section_header", "bbox": {"l": 308.862, "t": 321.184, "r": 444.936, "b": 331.932, "coord_origin": "TOPLEFT"}, "confidence": 0.9466595649719238, "cells": [{"index": 126, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 331.932, "r_x1": 444.936, "r_y1": 331.932, "r_x2": 444.936, "r_y2": 321.184, "r_x3": 308.862, "r_y3": 321.184, "coord_origin": "TOPLEFT"}, "text": "4. The TableFormer model", "orig": "4. The TableFormer model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "4. The TableFormer model"}, {"label": "text", "id": 0, "page_no": 3, "cluster": {"id": 0, "label": "text", "bbox": {"l": 308.862, "t": 342.208, "r": 545.115, "b": 446.401, "coord_origin": "TOPLEFT"}, "confidence": 0.9884450435638428, "cells": [{"index": 127, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 350.76, "r_x1": 545.115, "r_y1": 350.76, "r_x2": 545.115, "r_y2": 342.208, "r_x3": 320.817, "r_y3": 342.208, "coord_origin": "TOPLEFT"}, "text": "Given the image of a table, TableFormer is able to pre-", "orig": "Given the image of a table, TableFormer is able to pre-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 128, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 362.715, "r_x1": 326.576, "r_y1": 362.715, "r_x2": 326.576, "r_y2": 354.163, "r_x3": 308.862, "r_y3": 354.163, "coord_origin": "TOPLEFT"}, "text": "dict:", "orig": "dict:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 129, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 330.172, "r_y0": 362.715, "r_x1": 545.115, "r_y1": 362.715, "r_x2": 545.115, "r_y2": 354.163, "r_x3": 330.172, "r_y3": 354.163, "coord_origin": "TOPLEFT"}, "text": "1) a sequence of tokens that represent the structure of", "orig": "1) a sequence of tokens that represent the structure of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 130, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 374.67, "r_x1": 545.115, "r_y1": 374.67, "r_x2": 545.115, "r_y2": 366.118, "r_x3": 308.862, "r_y3": 366.118, "coord_origin": "TOPLEFT"}, "text": "a table, and 2) a bounding box coupled to a subset of those", "orig": "a table, and 2) a bounding box coupled to a subset of those", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 131, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 386.625, "r_x1": 337.265, "r_y1": 386.625, "r_x2": 337.265, "r_y2": 378.073, "r_x3": 308.862, "r_y3": 378.073, "coord_origin": "TOPLEFT"}, "text": "tokens.", "orig": "tokens.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 132, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 341.808, "r_y0": 386.625, "r_x1": 545.115, "r_y1": 386.625, "r_x2": 545.115, "r_y2": 378.073, "r_x3": 341.808, "r_y3": 378.073, "coord_origin": "TOPLEFT"}, "text": "The conversion of an image into a sequence of to-", "orig": "The conversion of an image into a sequence of to-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 133, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 398.58, "r_x1": 545.115, "r_y1": 398.58, "r_x2": 545.115, "r_y2": 390.028, "r_x3": 308.862, "r_y3": 390.028, "coord_origin": "TOPLEFT"}, "text": "kens is a well-known task [35, 16]. While attention is often", "orig": "kens is a well-known task [35, 16]. While attention is often", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 134, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 410.535, "r_x1": 545.115, "r_y1": 410.535, "r_x2": 545.115, "r_y2": 401.983, "r_x3": 308.862, "r_y3": 401.983, "coord_origin": "TOPLEFT"}, "text": "used as an implicit method to associate each token of the", "orig": "used as an implicit method to associate each token of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 135, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 422.491, "r_x1": 545.115, "r_y1": 422.491, "r_x2": 545.115, "r_y2": 413.939, "r_x3": 308.862, "r_y3": 413.939, "coord_origin": "TOPLEFT"}, "text": "sequence with a position in the original image, an explicit", "orig": "sequence with a position in the original image, an explicit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 136, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 434.446, "r_x1": 545.115, "r_y1": 434.446, "r_x2": 545.115, "r_y2": 425.894, "r_x3": 308.862, "r_y3": 425.894, "coord_origin": "TOPLEFT"}, "text": "association between the individual table-cells and the image", "orig": "association between the individual table-cells and the image", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 137, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 446.401, "r_x1": 437.937, "r_y1": 446.401, "r_x2": 437.937, "r_y2": 437.849, "r_x3": 308.862, "r_y3": 437.849, "coord_origin": "TOPLEFT"}, "text": "bounding boxes is also required.", "orig": "bounding boxes is also required.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Given the image of a table, TableFormer is able to predict: 1) a sequence of tokens that represent the structure of a table, and 2) a bounding box coupled to a subset of those tokens. The conversion of an image into a sequence of tokens is a well-known task [35, 16]. While attention is often used as an implicit method to associate each token of the sequence with a position in the original image, an explicit association between the individual table-cells and the image bounding boxes is also required."}, {"label": "section_header", "id": 12, "page_no": 3, "cluster": {"id": 12, "label": "section_header", "bbox": {"l": 308.862, "t": 457.694, "r": 420.161, "b": 467.546, "coord_origin": "TOPLEFT"}, "confidence": 0.937696099281311, "cells": [{"index": 138, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 467.546, "r_x1": 420.161, "r_y1": 467.546, "r_x2": 420.161, "r_y2": 457.694, "r_x3": 308.862, "r_y3": 457.694, "coord_origin": "TOPLEFT"}, "text": "4.1. Model architecture.", "orig": "4.1. Model architecture.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "4.1. Model architecture."}, {"label": "text", "id": 2, "page_no": 3, "cluster": {"id": 2, "label": "text", "bbox": {"l": 308.862, "t": 477.034, "r": 545.116, "b": 664.914, "coord_origin": "TOPLEFT"}, "confidence": 0.9878323078155518, "cells": [{"index": 139, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 485.586, "r_x1": 545.115, "r_y1": 485.586, "r_x2": 545.115, "r_y2": 477.034, "r_x3": 320.817, "r_y3": 477.034, "coord_origin": "TOPLEFT"}, "text": "We now describe in detail the proposed method, which", "orig": "We now describe in detail the proposed method, which", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 140, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 497.541, "r_x1": 315.507, "r_y1": 497.541, "r_x2": 315.507, "r_y2": 488.989, "r_x3": 308.862, "r_y3": 488.989, "coord_origin": "TOPLEFT"}, "text": "is", "orig": "is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 141, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 319.153, "r_y0": 497.541, "r_x1": 509.021, "r_y1": 497.541, "r_x2": 509.021, "r_y2": 488.989, "r_x3": 319.153, "r_y3": 488.989, "coord_origin": "TOPLEFT"}, "text": "composed of three main components, see Fig.", "orig": "composed of three main components, see Fig.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 142, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 515.586, "r_y0": 497.541, "r_x1": 523.058, "r_y1": 497.541, "r_x2": 523.058, "r_y2": 488.989, "r_x3": 515.586, "r_y3": 488.989, "coord_origin": "TOPLEFT"}, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 143, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 529.623, "r_y0": 497.541, "r_x1": 545.115, "r_y1": 497.541, "r_x2": 545.115, "r_y2": 488.989, "r_x3": 529.623, "r_y3": 488.989, "coord_origin": "TOPLEFT"}, "text": "Our", "orig": "Our", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 144, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 509.353, "r_x1": 406.346, "r_y1": 509.353, "r_x2": 406.346, "r_y2": 500.765, "r_x3": 308.862, "r_y3": 500.765, "coord_origin": "TOPLEFT"}, "text": "CNN Backbone Network", "orig": "CNN Backbone Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 145, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 408.872, "r_y0": 509.496, "r_x1": 545.111, "r_y1": 509.496, "r_x2": 545.111, "r_y2": 500.944, "r_x3": 408.872, "r_y3": 500.944, "coord_origin": "TOPLEFT"}, "text": "encodes the input as a feature vec-", "orig": "encodes the input as a feature vec-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 146, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 521.452, "r_x1": 319.93, "r_y1": 521.452, "r_x2": 319.93, "r_y2": 512.9, "r_x3": 308.862, "r_y3": 512.9, "coord_origin": "TOPLEFT"}, "text": "tor", "orig": "tor", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 147, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 323.836, "r_y0": 521.452, "r_x1": 409.395, "r_y1": 521.452, "r_x2": 409.395, "r_y2": 512.9, "r_x3": 323.836, "r_y3": 512.9, "coord_origin": "TOPLEFT"}, "text": "of predefined length.", "orig": "of predefined length.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 148, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 416.727, "r_y0": 521.452, "r_x1": 545.115, "r_y1": 521.452, "r_x2": 545.115, "r_y2": 512.9, "r_x3": 416.727, "r_y3": 512.9, "coord_origin": "TOPLEFT"}, "text": "The input feature vector of the", "orig": "The input feature vector of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 149, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 533.4069999999999, "r_x1": 436.194, "r_y1": 533.4069999999999, "r_x2": 436.194, "r_y2": 524.855, "r_x3": 308.862, "r_y3": 524.855, "coord_origin": "TOPLEFT"}, "text": "encoded image is passed to the", "orig": "encoded image is passed to the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 150, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 439.526, "r_y0": 533.264, "r_x1": 513.867, "r_y1": 533.264, "r_x2": 513.867, "r_y2": 524.6759999999999, "r_x3": 439.526, "r_y3": 524.6759999999999, "coord_origin": "TOPLEFT"}, "text": "Structure Decoder", "orig": "Structure Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 151, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 517.432, "r_y0": 533.4069999999999, "r_x1": 545.108, "r_y1": 533.4069999999999, "r_x2": 545.108, "r_y2": 524.855, "r_x3": 517.432, "r_y3": 524.855, "coord_origin": "TOPLEFT"}, "text": "to pro-", "orig": "to pro-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 152, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 545.362, "r_x1": 545.115, "r_y1": 545.362, "r_x2": 545.115, "r_y2": 536.81, "r_x3": 308.862, "r_y3": 536.81, "coord_origin": "TOPLEFT"}, "text": "duce a sequence of HTML tags that represent the structure", "orig": "duce a sequence of HTML tags that represent the structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 153, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 557.317, "r_x1": 358.545, "r_y1": 557.317, "r_x2": 358.545, "r_y2": 548.765, "r_x3": 308.862, "r_y3": 548.765, "coord_origin": "TOPLEFT"}, "text": "of the table.", "orig": "of the table.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 154, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 365.191, "r_y0": 557.317, "r_x1": 545.115, "r_y1": 557.317, "r_x2": 545.115, "r_y2": 548.765, "r_x3": 365.191, "r_y3": 548.765, "coord_origin": "TOPLEFT"}, "text": "With each prediction of an HTML standard", "orig": "With each prediction of an HTML standard", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 155, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 569.2719999999999, "r_x1": 352.409, "r_y1": 569.2719999999999, "r_x2": 352.409, "r_y2": 560.72, "r_x3": 308.862, "r_y3": 560.72, "coord_origin": "TOPLEFT"}, "text": "data cell ('", "orig": "data cell ('", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 156, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 352.409, "r_y0": 569.108, "r_x1": 360.158, "r_y1": 569.108, "r_x2": 360.158, "r_y2": 560.402, "r_x3": 352.409, "r_y3": 560.402, "coord_origin": "TOPLEFT"}, "text": "<", "orig": "<", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 157, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 360.158, "r_y0": 569.2719999999999, "r_x1": 367.909, "r_y1": 569.2719999999999, "r_x2": 367.909, "r_y2": 560.72, "r_x3": 360.158, "r_y3": 560.72, "coord_origin": "TOPLEFT"}, "text": "td", "orig": "td", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 158, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 367.909, "r_y0": 569.108, "r_x1": 375.658, "r_y1": 569.108, "r_x2": 375.658, "r_y2": 560.402, "r_x3": 367.909, "r_y3": 560.402, "coord_origin": "TOPLEFT"}, "text": ">", "orig": ">", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 159, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 375.658, "r_y0": 569.2719999999999, "r_x1": 545.112, "r_y1": 569.2719999999999, "r_x2": 545.112, "r_y2": 560.72, "r_x3": 375.658, "r_y3": 560.72, "coord_origin": "TOPLEFT"}, "text": "') the hidden state of that cell is passed to", "orig": "') the hidden state of that cell is passed to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 160, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 581.2280000000001, "r_x1": 545.115, "r_y1": 581.2280000000001, "r_x2": 545.115, "r_y2": 572.6759999999999, "r_x3": 308.862, "r_y3": 572.6759999999999, "coord_origin": "TOPLEFT"}, "text": "the Cell BBox Decoder. As for spanning cells, such as row", "orig": "the Cell BBox Decoder. As for spanning cells, such as row", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 161, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 593.183, "r_x1": 483.118, "r_y1": 593.183, "r_x2": 483.118, "r_y2": 584.631, "r_x3": 308.862, "r_y3": 584.631, "coord_origin": "TOPLEFT"}, "text": "or column span, the tag is broken down to '", "orig": "or column span, the tag is broken down to '", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 162, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 483.119, "r_y0": 593.019, "r_x1": 490.868, "r_y1": 593.019, "r_x2": 490.868, "r_y2": 584.313, "r_x3": 483.119, "r_y3": 584.313, "coord_origin": "TOPLEFT"}, "text": "<", "orig": "<", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 163, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 490.868, "r_y0": 593.183, "r_x1": 545.114, "r_y1": 593.183, "r_x2": 545.114, "r_y2": 584.631, "r_x3": 490.868, "r_y3": 584.631, "coord_origin": "TOPLEFT"}, "text": "', 'rowspan='", "orig": "', 'rowspan='", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 164, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 605.138, "r_x1": 545.115, "r_y1": 605.138, "r_x2": 545.115, "r_y2": 596.586, "r_x3": 308.862, "r_y3": 596.586, "coord_origin": "TOPLEFT"}, "text": "or 'colspan=', with the number of spanning cells (attribute),", "orig": "or 'colspan=', with the number of spanning cells (attribute),", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 165, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 617.093, "r_x1": 329.644, "r_y1": 617.093, "r_x2": 329.644, "r_y2": 608.5409999999999, "r_x3": 308.862, "r_y3": 608.5409999999999, "coord_origin": "TOPLEFT"}, "text": "and '", "orig": "and '", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 166, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 329.646, "r_y0": 616.929, "r_x1": 337.395, "r_y1": 616.929, "r_x2": 337.395, "r_y2": 608.223, "r_x3": 329.646, "r_y3": 608.223, "coord_origin": "TOPLEFT"}, "text": ">", "orig": ">", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 167, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 337.394, "r_y0": 617.093, "r_x1": 343.202, "r_y1": 617.093, "r_x2": 343.202, "r_y2": 608.5409999999999, "r_x3": 337.394, "r_y3": 608.5409999999999, "coord_origin": "TOPLEFT"}, "text": "'.", "orig": "'.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 168, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 348.064, "r_y0": 617.093, "r_x1": 468.591, "r_y1": 617.093, "r_x2": 468.591, "r_y2": 608.5409999999999, "r_x3": 348.064, "r_y3": 608.5409999999999, "coord_origin": "TOPLEFT"}, "text": "The hidden state attached to '", "orig": "The hidden state attached to '", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 169, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 468.595, "r_y0": 616.929, "r_x1": 476.344, "r_y1": 616.929, "r_x2": 476.344, "r_y2": 608.223, "r_x3": 468.595, "r_y3": 608.223, "coord_origin": "TOPLEFT"}, "text": "<", "orig": "<", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 170, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 476.344, "r_y0": 617.093, "r_x1": 545.116, "r_y1": 617.093, "r_x2": 545.116, "r_y2": 608.5409999999999, "r_x3": 476.344, "r_y3": 608.5409999999999, "coord_origin": "TOPLEFT"}, "text": "' is passed to the", "orig": "' is passed to the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 171, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 629.048, "r_x1": 545.115, "r_y1": 629.048, "r_x2": 545.115, "r_y2": 620.496, "r_x3": 308.862, "r_y3": 620.496, "coord_origin": "TOPLEFT"}, "text": "Cell BBox Decoder. A shared feed forward network (FFN)", "orig": "Cell BBox Decoder. A shared feed forward network (FFN)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 172, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 641.0029999999999, "r_x1": 533.2, "r_y1": 641.0029999999999, "r_x2": 533.2, "r_y2": 632.451, "r_x3": 308.862, "r_y3": 632.451, "coord_origin": "TOPLEFT"}, "text": "receives the hidden states from the Structure Decoder,", "orig": "receives the hidden states from the Structure Decoder,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 173, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 537.364, "r_y0": 641.0029999999999, "r_x1": 545.115, "r_y1": 641.0029999999999, "r_x2": 545.115, "r_y2": 632.451, "r_x3": 537.364, "r_y3": 632.451, "coord_origin": "TOPLEFT"}, "text": "to", "orig": "to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 174, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 652.9590000000001, "r_x1": 545.115, "r_y1": 652.9590000000001, "r_x2": 545.115, "r_y2": 644.407, "r_x3": 308.862, "r_y3": 644.407, "coord_origin": "TOPLEFT"}, "text": "provide the final detection predictions of the bounding box", "orig": "provide the final detection predictions of the bounding box", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 175, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 664.914, "r_x1": 449.424, "r_y1": 664.914, "r_x2": 449.424, "r_y2": 656.362, "r_x3": 308.862, "r_y3": 656.362, "coord_origin": "TOPLEFT"}, "text": "coordinates and their classification.", "orig": "coordinates and their classification.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "We now describe in detail the proposed method, which is composed of three main components, see Fig. 4. Our CNN Backbone Network encodes the input as a feature vector of predefined length. The input feature vector of the encoded image is passed to the Structure Decoder to produce a sequence of HTML tags that represent the structure of the table. With each prediction of an HTML standard data cell (' < td > ') the hidden state of that cell is passed to the Cell BBox Decoder. As for spanning cells, such as row or column span, the tag is broken down to ' < ', 'rowspan=' or 'colspan=', with the number of spanning cells (attribute), and ' > '. The hidden state attached to ' < ' is passed to the Cell BBox Decoder. A shared feed forward network (FFN) receives the hidden states from the Structure Decoder, to provide the final detection predictions of the bounding box coordinates and their classification."}, {"label": "text", "id": 7, "page_no": 3, "cluster": {"id": 7, "label": "text", "bbox": {"l": 308.862, "t": 668.261, "r": 545.115, "b": 713.066, "coord_origin": "TOPLEFT"}, "confidence": 0.978580117225647, "cells": [{"index": 176, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 677.217, "r_x1": 431.91, "r_y1": 677.217, "r_x2": 431.91, "r_y2": 668.261, "r_x3": 320.817, "r_y3": 668.261, "coord_origin": "TOPLEFT"}, "text": "CNN Backbone Network.", "orig": "CNN Backbone Network.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 177, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 439.499, "r_y0": 677.201, "r_x1": 545.113, "r_y1": 677.201, "r_x2": 545.113, "r_y2": 668.649, "r_x3": 439.499, "r_y3": 668.649, "coord_origin": "TOPLEFT"}, "text": "A ResNet-18 CNN is the", "orig": "A ResNet-18 CNN is the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 178, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 689.156, "r_x1": 545.115, "r_y1": 689.156, "r_x2": 545.115, "r_y2": 680.604, "r_x3": 308.862, "r_y3": 680.604, "coord_origin": "TOPLEFT"}, "text": "backbone that receives the table image and encodes it as a", "orig": "backbone that receives the table image and encodes it as a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 179, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 701.111, "r_x1": 545.115, "r_y1": 701.111, "r_x2": 545.115, "r_y2": 692.559, "r_x3": 308.862, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "vector of predefined length. The network has been modified", "orig": "vector of predefined length. The network has been modified", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 180, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 713.066, "r_x1": 545.115, "r_y1": 713.066, "r_x2": 545.115, "r_y2": 704.514, "r_x3": 308.862, "r_y3": 704.514, "coord_origin": "TOPLEFT"}, "text": "by removing the linear and pooling layer, as we are not per-", "orig": "by removing the linear and pooling layer, as we are not per-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "CNN Backbone Network. A ResNet-18 CNN is the backbone that receives the table image and encodes it as a vector of predefined length. The network has been modified by removing the linear and pooling layer, as we are not per-"}, {"label": "page_footer", "id": 14, "page_no": 3, "cluster": {"id": 14, "label": "page_footer", "bbox": {"l": 295.121, "t": 734.402, "r": 300.102, "b": 742.954, "coord_origin": "TOPLEFT"}, "confidence": 0.8565718531608582, "cells": [{"index": 181, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 295.121, "r_y0": 742.954, "r_x1": 300.102, "r_y1": 742.954, "r_x2": 300.102, "r_y2": 734.402, "r_x3": 295.121, "r_y3": 734.402, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "4"}], "body": [{"label": "text", "id": 10, "page_no": 3, "cluster": {"id": 10, "label": "text", "bbox": {"l": 50.112, "t": 75.47699999999998, "r": 286.365, "b": 95.98400000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.9611433148384094, "cells": [{"index": 0, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 84.029, "r_x1": 286.365, "r_y1": 84.029, "r_x2": 286.365, "r_y2": 75.47699999999998, "r_x3": 50.112, "r_y3": 75.47699999999998, "coord_origin": "TOPLEFT"}, "text": "amount of such tables, and kept only those ones ranging", "orig": "amount of such tables, and kept only those ones ranging", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 95.98400000000004, "r_x1": 212.283, "r_y1": 95.98400000000004, "r_x2": 212.283, "r_y2": 87.43200000000002, "r_x3": 50.112, "r_y3": 87.43200000000002, "coord_origin": "TOPLEFT"}, "text": "between 1*1 and 20*10 (rows/columns).", "orig": "between 1*1 and 20*10 (rows/columns).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "amount of such tables, and kept only those ones ranging between 1*1 and 20*10 (rows/columns)."}, {"label": "text", "id": 1, "page_no": 3, "cluster": {"id": 1, "label": "text", "bbox": {"l": 50.112, "t": 101.22900000000004, "r": 286.365, "b": 313.019, "coord_origin": "TOPLEFT"}, "confidence": 0.988013744354248, "cells": [{"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 109.78099999999995, "r_x1": 286.365, "r_y1": 109.78099999999995, "r_x2": 286.365, "r_y2": 101.22900000000004, "r_x3": 62.067, "r_y3": 101.22900000000004, "coord_origin": "TOPLEFT"}, "text": "The availability of the bounding boxes for all table cells", "orig": "The availability of the bounding boxes for all table cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 121.73599999999999, "r_x1": 176.458, "r_y1": 121.73599999999999, "r_x2": 176.458, "r_y2": 113.18399999999997, "r_x3": 50.112, "r_y3": 113.18399999999997, "coord_origin": "TOPLEFT"}, "text": "is essential to train our models.", "orig": "is essential to train our models.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 180.971, "r_y0": 121.73599999999999, "r_x1": 286.365, "r_y1": 121.73599999999999, "r_x2": 286.365, "r_y2": 113.18399999999997, "r_x3": 180.971, "r_y3": 113.18399999999997, "coord_origin": "TOPLEFT"}, "text": "In order to distinguish be-", "orig": "In order to distinguish be-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 133.69100000000003, "r_x1": 286.365, "r_y1": 133.69100000000003, "r_x2": 286.365, "r_y2": 125.13900000000001, "r_x3": 50.112, "r_y3": 125.13900000000001, "coord_origin": "TOPLEFT"}, "text": "tween empty and non-empty bounding boxes, we have in-", "orig": "tween empty and non-empty bounding boxes, we have in-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 145.64700000000005, "r_x1": 286.365, "r_y1": 145.64700000000005, "r_x2": 286.365, "r_y2": 137.09500000000003, "r_x3": 50.112, "r_y3": 137.09500000000003, "coord_origin": "TOPLEFT"}, "text": "troduced a binary class in the annotation. Unfortunately, the", "orig": "troduced a binary class in the annotation. Unfortunately, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 157.60199999999998, "r_x1": 286.365, "r_y1": 157.60199999999998, "r_x2": 286.365, "r_y2": 149.04999999999995, "r_x3": 50.112, "r_y3": 149.04999999999995, "coord_origin": "TOPLEFT"}, "text": "original datasets either omit the bounding boxes for whole", "orig": "original datasets either omit the bounding boxes for whole", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 169.55700000000002, "r_x1": 94.127, "r_y1": 169.55700000000002, "r_x2": 94.127, "r_y2": 161.005, "r_x3": 50.112, "r_y3": 161.005, "coord_origin": "TOPLEFT"}, "text": "tables (e.g.", "orig": "tables (e.g.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 98.959, "r_y0": 169.55700000000002, "r_x1": 286.365, "r_y1": 169.55700000000002, "r_x2": 286.365, "r_y2": 161.005, "r_x3": 98.959, "r_y3": 161.005, "coord_origin": "TOPLEFT"}, "text": "TableBank) or they narrow their scope only to", "orig": "TableBank) or they narrow their scope only to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 181.51199999999994, "r_x1": 116.951, "r_y1": 181.51199999999994, "r_x2": 116.951, "r_y2": 172.96000000000004, "r_x3": 50.112, "r_y3": 172.96000000000004, "coord_origin": "TOPLEFT"}, "text": "non-empty cells.", "orig": "non-empty cells.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 121.345, "r_y0": 181.51199999999994, "r_x1": 286.365, "r_y1": 181.51199999999994, "r_x2": 286.365, "r_y2": 172.96000000000004, "r_x3": 121.345, "r_y3": 172.96000000000004, "coord_origin": "TOPLEFT"}, "text": "Therefore, it was imperative to introduce", "orig": "Therefore, it was imperative to introduce", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 193.46699999999998, "r_x1": 286.365, "r_y1": 193.46699999999998, "r_x2": 286.365, "r_y2": 184.91499999999996, "r_x3": 50.112, "r_y3": 184.91499999999996, "coord_origin": "TOPLEFT"}, "text": "a data pre-processing procedure that generates the missing", "orig": "a data pre-processing procedure that generates the missing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 205.423, "r_x1": 286.365, "r_y1": 205.423, "r_x2": 286.365, "r_y2": 196.87099999999998, "r_x3": 50.112, "r_y3": 196.87099999999998, "coord_origin": "TOPLEFT"}, "text": "bounding boxes out of the annotation information. This pro-", "orig": "bounding boxes out of the annotation information. This pro-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 217.37800000000004, "r_x1": 286.365, "r_y1": 217.37800000000004, "r_x2": 286.365, "r_y2": 208.82600000000002, "r_x3": 50.112, "r_y3": 208.82600000000002, "coord_origin": "TOPLEFT"}, "text": "cedure first parses the provided table structure and calcu-", "orig": "cedure first parses the provided table structure and calcu-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 229.33299999999997, "r_x1": 286.365, "r_y1": 229.33299999999997, "r_x2": 286.365, "r_y2": 220.78099999999995, "r_x3": 50.112, "r_y3": 220.78099999999995, "coord_origin": "TOPLEFT"}, "text": "lates the dimensions of the most fine-grained grid that cov-", "orig": "lates the dimensions of the most fine-grained grid that cov-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 241.288, "r_x1": 139.805, "r_y1": 241.288, "r_x2": 139.805, "r_y2": 232.736, "r_x3": 50.112, "r_y3": 232.736, "coord_origin": "TOPLEFT"}, "text": "ers the table structure.", "orig": "ers the table structure.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 144.607, "r_y0": 241.288, "r_x1": 286.365, "r_y1": 241.288, "r_x2": 286.365, "r_y2": 232.736, "r_x3": 144.607, "r_y3": 232.736, "coord_origin": "TOPLEFT"}, "text": "Notice that each table cell may oc-", "orig": "Notice that each table cell may oc-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 253.24300000000005, "r_x1": 286.365, "r_y1": 253.24300000000005, "r_x2": 286.365, "r_y2": 244.69100000000003, "r_x3": 50.112, "r_y3": 244.69100000000003, "coord_origin": "TOPLEFT"}, "text": "cupy multiple grid squares due to row or column spans. In", "orig": "cupy multiple grid squares due to row or column spans. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 19, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 265.198, "r_x1": 286.365, "r_y1": 265.198, "r_x2": 286.365, "r_y2": 256.64599999999996, "r_x3": 50.112, "r_y3": 256.64599999999996, "coord_origin": "TOPLEFT"}, "text": "case of PubTabNet we had to compute missing bounding", "orig": "case of PubTabNet we had to compute missing bounding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 20, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 277.154, "r_x1": 286.365, "r_y1": 277.154, "r_x2": 286.365, "r_y2": 268.602, "r_x3": 50.112, "r_y3": 268.602, "coord_origin": "TOPLEFT"}, "text": "boxes for 48% of the simple and 69% of the complex ta-", "orig": "boxes for 48% of the simple and 69% of the complex ta-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 21, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 289.109, "r_x1": 68.652, "r_y1": 289.109, "r_x2": 68.652, "r_y2": 280.557, "r_x3": 50.112, "r_y3": 280.557, "coord_origin": "TOPLEFT"}, "text": "bles.", "orig": "bles.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 22, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 75.566, "r_y0": 289.109, "r_x1": 286.365, "r_y1": 289.109, "r_x2": 286.365, "r_y2": 280.557, "r_x3": 75.566, "r_y3": 280.557, "coord_origin": "TOPLEFT"}, "text": "Regarding FinTabNet, 68% of the simple and 98%", "orig": "Regarding FinTabNet, 68% of the simple and 98%", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 23, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 301.064, "r_x1": 286.365, "r_y1": 301.064, "r_x2": 286.365, "r_y2": 292.512, "r_x3": 50.112, "r_y3": 292.512, "coord_origin": "TOPLEFT"}, "text": "of the complex tables require the generation of bounding", "orig": "of the complex tables require the generation of bounding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 24, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 313.019, "r_x1": 75.696, "r_y1": 313.019, "r_x2": 75.696, "r_y2": 304.467, "r_x3": 50.112, "r_y3": 304.467, "coord_origin": "TOPLEFT"}, "text": "boxes.", "orig": "boxes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "The availability of the bounding boxes for all table cells is essential to train our models. In order to distinguish between empty and non-empty bounding boxes, we have introduced a binary class in the annotation. Unfortunately, the original datasets either omit the bounding boxes for whole tables (e.g. TableBank) or they narrow their scope only to non-empty cells. Therefore, it was imperative to introduce a data pre-processing procedure that generates the missing bounding boxes out of the annotation information. This procedure first parses the provided table structure and calculates the dimensions of the most fine-grained grid that covers the table structure. Notice that each table cell may occupy multiple grid squares due to row or column spans. In case of PubTabNet we had to compute missing bounding boxes for 48% of the simple and 69% of the complex tables. Regarding FinTabNet, 68% of the simple and 98% of the complex tables require the generation of bounding boxes."}, {"label": "text", "id": 4, "page_no": 3, "cluster": {"id": 4, "label": "text", "bbox": {"l": 50.112, "t": 318.264, "r": 286.365, "b": 434.413, "coord_origin": "TOPLEFT"}, "confidence": 0.9873981475830078, "cells": [{"index": 25, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 326.816, "r_x1": 286.365, "r_y1": 326.816, "r_x2": 286.365, "r_y2": 318.264, "r_x3": 62.067, "r_y3": 318.264, "coord_origin": "TOPLEFT"}, "text": "As it is illustrated in Fig. 2, the table distributions from", "orig": "As it is illustrated in Fig. 2, the table distributions from", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 26, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 338.772, "r_x1": 60.075, "r_y1": 338.772, "r_x2": 60.075, "r_y2": 330.22, "r_x3": 50.112, "r_y3": 330.22, "coord_origin": "TOPLEFT"}, "text": "all", "orig": "all", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 27, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 65.146, "r_y0": 338.772, "r_x1": 96.687, "r_y1": 338.772, "r_x2": 96.687, "r_y2": 330.22, "r_x3": 65.146, "r_y3": 330.22, "coord_origin": "TOPLEFT"}, "text": "datasets", "orig": "datasets", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 28, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 101.768, "r_y0": 338.772, "r_x1": 113.932, "r_y1": 338.772, "r_x2": 113.932, "r_y2": 330.22, "r_x3": 101.768, "r_y3": 330.22, "coord_origin": "TOPLEFT"}, "text": "are", "orig": "are", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 29, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 119.003, "r_y0": 338.772, "r_x1": 148.533, "r_y1": 338.772, "r_x2": 148.533, "r_y2": 330.22, "r_x3": 119.003, "r_y3": 330.22, "coord_origin": "TOPLEFT"}, "text": "skewed", "orig": "skewed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 30, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 153.613, "r_y0": 338.772, "r_x1": 184.806, "r_y1": 338.772, "r_x2": 184.806, "r_y2": 330.22, "r_x3": 153.613, "r_y3": 330.22, "coord_origin": "TOPLEFT"}, "text": "towards", "orig": "towards", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 189.877, "r_y0": 338.772, "r_x1": 219.765, "r_y1": 338.772, "r_x2": 219.765, "r_y2": 330.22, "r_x3": 189.877, "r_y3": 330.22, "coord_origin": "TOPLEFT"}, "text": "simpler", "orig": "simpler", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 224.836, "r_y0": 338.772, "r_x1": 263.571, "r_y1": 338.772, "r_x2": 263.571, "r_y2": 330.22, "r_x3": 224.836, "r_y3": 330.22, "coord_origin": "TOPLEFT"}, "text": "structures", "orig": "structures", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 268.652, "r_y0": 338.772, "r_x1": 286.365, "r_y1": 338.772, "r_x2": 286.365, "r_y2": 330.22, "r_x3": 268.652, "r_y3": 330.22, "coord_origin": "TOPLEFT"}, "text": "with", "orig": "with", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 350.727, "r_x1": 286.365, "r_y1": 350.727, "r_x2": 286.365, "r_y2": 342.175, "r_x3": 50.112, "r_y3": 342.175, "coord_origin": "TOPLEFT"}, "text": "fewer number of rows/columns. Additionally, there is very", "orig": "fewer number of rows/columns. Additionally, there is very", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 362.682, "r_x1": 286.365, "r_y1": 362.682, "r_x2": 286.365, "r_y2": 354.13, "r_x3": 50.112, "r_y3": 354.13, "coord_origin": "TOPLEFT"}, "text": "limited variance in the table styles, which in case of Pub-", "orig": "limited variance in the table styles, which in case of Pub-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 374.637, "r_x1": 286.365, "r_y1": 374.637, "r_x2": 286.365, "r_y2": 366.085, "r_x3": 50.112, "r_y3": 366.085, "coord_origin": "TOPLEFT"}, "text": "TabNet and FinTabNet means one styling format for the", "orig": "TabNet and FinTabNet means one styling format for the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 386.592, "r_x1": 141.589, "r_y1": 386.592, "r_x2": 141.589, "r_y2": 378.04, "r_x3": 50.112, "r_y3": 378.04, "coord_origin": "TOPLEFT"}, "text": "majority of the tables.", "orig": "majority of the tables.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 148.702, "r_y0": 386.592, "r_x1": 286.365, "r_y1": 386.592, "r_x2": 286.365, "r_y2": 378.04, "r_x3": 148.702, "r_y3": 378.04, "coord_origin": "TOPLEFT"}, "text": "Similar limitations appear also in", "orig": "Similar limitations appear also in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 398.547, "r_x1": 286.365, "r_y1": 398.547, "r_x2": 286.365, "r_y2": 389.995, "r_x3": 50.112, "r_y3": 389.995, "coord_origin": "TOPLEFT"}, "text": "the type of table content, which in some cases (e.g. FinTab-", "orig": "the type of table content, which in some cases (e.g. FinTab-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 410.503, "r_x1": 201.822, "r_y1": 410.503, "r_x2": 201.822, "r_y2": 401.951, "r_x3": 50.112, "r_y3": 401.951, "coord_origin": "TOPLEFT"}, "text": "Net) is restricted to a certain domain.", "orig": "Net) is restricted to a certain domain.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 206.764, "r_y0": 410.503, "r_x1": 286.365, "r_y1": 410.503, "r_x2": 286.365, "r_y2": 401.951, "r_x3": 206.764, "r_y3": 401.951, "coord_origin": "TOPLEFT"}, "text": "Ultimately, the lack", "orig": "Ultimately, the lack", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 422.458, "r_x1": 286.365, "r_y1": 422.458, "r_x2": 286.365, "r_y2": 413.906, "r_x3": 50.112, "r_y3": 413.906, "coord_origin": "TOPLEFT"}, "text": "of diversity in the training dataset damages the ability of the", "orig": "of diversity in the training dataset damages the ability of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 434.413, "r_x1": 216.398, "r_y1": 434.413, "r_x2": 216.398, "r_y2": 425.861, "r_x3": 50.112, "r_y3": 425.861, "coord_origin": "TOPLEFT"}, "text": "models to generalize well on unseen data.", "orig": "models to generalize well on unseen data.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "As it is illustrated in Fig. 2, the table distributions from all datasets are skewed towards simpler structures with fewer number of rows/columns. Additionally, there is very limited variance in the table styles, which in case of PubTabNet and FinTabNet means one styling format for the majority of the tables. Similar limitations appear also in the type of table content, which in some cases (e.g. FinTabNet) is restricted to a certain domain. Ultimately, the lack of diversity in the training dataset damages the ability of the models to generalize well on unseen data."}, {"label": "text", "id": 3, "page_no": 3, "cluster": {"id": 3, "label": "text", "bbox": {"l": 50.112, "t": 439.658, "r": 286.367, "b": 627.538, "coord_origin": "TOPLEFT"}, "confidence": 0.9876030087471008, "cells": [{"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 448.21, "r_x1": 286.365, "r_y1": 448.21, "r_x2": 286.365, "r_y2": 439.658, "r_x3": 62.067, "r_y3": 439.658, "coord_origin": "TOPLEFT"}, "text": "Motivated by those observations we aimed at generating", "orig": "Motivated by those observations we aimed at generating", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 460.165, "r_x1": 172.144, "r_y1": 460.165, "r_x2": 172.144, "r_y2": 451.613, "r_x3": 50.112, "r_y3": 451.613, "coord_origin": "TOPLEFT"}, "text": "a synthetic table dataset named", "orig": "a synthetic table dataset named", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 174.148, "r_y0": 460.022, "r_x1": 224.708, "r_y1": 460.022, "r_x2": 224.708, "r_y2": 451.434, "r_x3": 174.148, "r_y3": 451.434, "coord_origin": "TOPLEFT"}, "text": "SynthTabNet", "orig": "SynthTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 224.708, "r_y0": 460.165, "r_x1": 227.199, "r_y1": 460.165, "r_x2": 227.199, "r_y2": 451.613, "r_x3": 224.708, "r_y3": 451.613, "coord_origin": "TOPLEFT"}, "text": ".", "orig": ".", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 48, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 230.128, "r_y0": 460.165, "r_x1": 286.367, "r_y1": 460.165, "r_x2": 286.367, "r_y2": 451.613, "r_x3": 230.128, "r_y3": 451.613, "coord_origin": "TOPLEFT"}, "text": "This approach", "orig": "This approach", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 49, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 472.121, "r_x1": 128.179, "r_y1": 472.121, "r_x2": 128.179, "r_y2": 463.569, "r_x3": 50.112, "r_y3": 463.569, "coord_origin": "TOPLEFT"}, "text": "offers control over:", "orig": "offers control over:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 50, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 132.971, "r_y0": 472.121, "r_x1": 286.365, "r_y1": 472.121, "r_x2": 286.365, "r_y2": 463.569, "r_x3": 132.971, "r_y3": 463.569, "coord_origin": "TOPLEFT"}, "text": "1) the size of the dataset, 2) the table", "orig": "1) the size of the dataset, 2) the table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 51, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 484.076, "r_x1": 266.739, "r_y1": 484.076, "r_x2": 266.739, "r_y2": 475.524, "r_x3": 50.112, "r_y3": 475.524, "coord_origin": "TOPLEFT"}, "text": "structure, 3) the table style and 4) the type of content.", "orig": "structure, 3) the table style and 4) the type of content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 52, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 270.873, "r_y0": 484.076, "r_x1": 286.365, "r_y1": 484.076, "r_x2": 286.365, "r_y2": 475.524, "r_x3": 270.873, "r_y3": 475.524, "coord_origin": "TOPLEFT"}, "text": "The", "orig": "The", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 53, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 496.031, "r_x1": 286.365, "r_y1": 496.031, "r_x2": 286.365, "r_y2": 487.479, "r_x3": 50.112, "r_y3": 487.479, "coord_origin": "TOPLEFT"}, "text": "complexity of the table structure is described by the size of", "orig": "complexity of the table structure is described by the size of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 54, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 507.986, "r_x1": 286.365, "r_y1": 507.986, "r_x2": 286.365, "r_y2": 499.434, "r_x3": 50.112, "r_y3": 499.434, "coord_origin": "TOPLEFT"}, "text": "the table header and the table body, as well as the percentage", "orig": "the table header and the table body, as well as the percentage", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 55, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 519.941, "r_x1": 286.365, "r_y1": 519.941, "r_x2": 286.365, "r_y2": 511.389, "r_x3": 50.112, "r_y3": 511.389, "coord_origin": "TOPLEFT"}, "text": "of the table cells covered by row spans and column spans.", "orig": "of the table cells covered by row spans and column spans.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 56, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 531.8969999999999, "r_x1": 286.365, "r_y1": 531.8969999999999, "r_x2": 286.365, "r_y2": 523.345, "r_x3": 50.112, "r_y3": 523.345, "coord_origin": "TOPLEFT"}, "text": "A set of carefully designed styling templates provides the", "orig": "A set of carefully designed styling templates provides the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 57, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 543.852, "r_x1": 286.365, "r_y1": 543.852, "r_x2": 286.365, "r_y2": 535.3, "r_x3": 50.112, "r_y3": 535.3, "coord_origin": "TOPLEFT"}, "text": "basis to build a wide range of table appearances. Lastly, the", "orig": "basis to build a wide range of table appearances. Lastly, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 58, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 555.807, "r_x1": 286.365, "r_y1": 555.807, "r_x2": 286.365, "r_y2": 547.255, "r_x3": 50.112, "r_y3": 547.255, "coord_origin": "TOPLEFT"}, "text": "table content is generated out of a curated collection of text", "orig": "table content is generated out of a curated collection of text", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 59, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 567.762, "r_x1": 83.028, "r_y1": 567.762, "r_x2": 83.028, "r_y2": 559.21, "r_x3": 50.112, "r_y3": 559.21, "coord_origin": "TOPLEFT"}, "text": "corpora.", "orig": "corpora.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 60, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 87.153, "r_y0": 567.762, "r_x1": 286.365, "r_y1": 567.762, "r_x2": 286.365, "r_y2": 559.21, "r_x3": 87.153, "r_y3": 559.21, "coord_origin": "TOPLEFT"}, "text": "By controlling the size and scope of the synthetic", "orig": "By controlling the size and scope of the synthetic", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 61, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 579.717, "r_x1": 286.365, "r_y1": 579.717, "r_x2": 286.365, "r_y2": 571.165, "r_x3": 50.112, "r_y3": 571.165, "coord_origin": "TOPLEFT"}, "text": "datasets we are able to train and evaluate our models in a", "orig": "datasets we are able to train and evaluate our models in a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 62, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 591.672, "r_x1": 174.645, "r_y1": 591.672, "r_x2": 174.645, "r_y2": 583.12, "r_x3": 50.112, "r_y3": 583.12, "coord_origin": "TOPLEFT"}, "text": "variety of different conditions.", "orig": "variety of different conditions.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 63, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 181.021, "r_y0": 591.672, "r_x1": 286.365, "r_y1": 591.672, "r_x2": 286.365, "r_y2": 583.12, "r_x3": 181.021, "r_y3": 583.12, "coord_origin": "TOPLEFT"}, "text": "For example, we can first", "orig": "For example, we can first", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 64, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 603.6279999999999, "r_x1": 286.365, "r_y1": 603.6279999999999, "r_x2": 286.365, "r_y2": 595.076, "r_x3": 50.112, "r_y3": 595.076, "coord_origin": "TOPLEFT"}, "text": "generate a highly diverse dataset to train our models and", "orig": "generate a highly diverse dataset to train our models and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 65, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 615.583, "r_x1": 286.365, "r_y1": 615.583, "r_x2": 286.365, "r_y2": 607.031, "r_x3": 50.112, "r_y3": 607.031, "coord_origin": "TOPLEFT"}, "text": "then evaluate their performance on other synthetic datasets", "orig": "then evaluate their performance on other synthetic datasets", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 66, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 627.538, "r_x1": 209.753, "r_y1": 627.538, "r_x2": 209.753, "r_y2": 618.986, "r_x3": 50.112, "r_y3": 618.986, "coord_origin": "TOPLEFT"}, "text": "which are focused on a specific domain.", "orig": "which are focused on a specific domain.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Motivated by those observations we aimed at generating a synthetic table dataset named SynthTabNet . This approach offers control over: 1) the size of the dataset, 2) the table structure, 3) the table style and 4) the type of content. The complexity of the table structure is described by the size of the table header and the table body, as well as the percentage of the table cells covered by row spans and column spans. A set of carefully designed styling templates provides the basis to build a wide range of table appearances. Lastly, the table content is generated out of a curated collection of text corpora. By controlling the size and scope of the synthetic datasets we are able to train and evaluate our models in a variety of different conditions. For example, we can first generate a highly diverse dataset to train our models and then evaluate their performance on other synthetic datasets which are focused on a specific domain."}, {"label": "text", "id": 5, "page_no": 3, "cluster": {"id": 5, "label": "text", "bbox": {"l": 50.112, "t": 632.783, "r": 286.365, "b": 713.066, "coord_origin": "TOPLEFT"}, "confidence": 0.9871614575386047, "cells": [{"index": 67, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 641.335, "r_x1": 286.365, "r_y1": 641.335, "r_x2": 286.365, "r_y2": 632.783, "r_x3": 62.067, "r_y3": 632.783, "coord_origin": "TOPLEFT"}, "text": "In this regard, we have prepared four synthetic datasets,", "orig": "In this regard, we have prepared four synthetic datasets,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 68, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 653.29, "r_x1": 286.365, "r_y1": 653.29, "r_x2": 286.365, "r_y2": 644.738, "r_x3": 50.112, "r_y3": 644.738, "coord_origin": "TOPLEFT"}, "text": "each one containing 150k examples. The corpora to gener-", "orig": "each one containing 150k examples. The corpora to gener-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 69, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 665.246, "r_x1": 286.365, "r_y1": 665.246, "r_x2": 286.365, "r_y2": 656.694, "r_x3": 50.112, "r_y3": 656.694, "coord_origin": "TOPLEFT"}, "text": "ate the table text consists of the most frequent terms appear-", "orig": "ate the table text consists of the most frequent terms appear-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 70, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 677.201, "r_x1": 286.365, "r_y1": 677.201, "r_x2": 286.365, "r_y2": 668.649, "r_x3": 50.112, "r_y3": 668.649, "coord_origin": "TOPLEFT"}, "text": "ing in PubTabNet and FinTabNet together with randomly", "orig": "ing in PubTabNet and FinTabNet together with randomly", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 71, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 689.156, "r_x1": 109.519, "r_y1": 689.156, "r_x2": 109.519, "r_y2": 680.604, "r_x3": 50.112, "r_y3": 680.604, "coord_origin": "TOPLEFT"}, "text": "generated text.", "orig": "generated text.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 72, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 115.337, "r_y0": 689.156, "r_x1": 286.365, "r_y1": 689.156, "r_x2": 286.365, "r_y2": 680.604, "r_x3": 115.337, "r_y3": 680.604, "coord_origin": "TOPLEFT"}, "text": "The first two synthetic datasets have been", "orig": "The first two synthetic datasets have been", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 73, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 701.111, "r_x1": 286.365, "r_y1": 701.111, "r_x2": 286.365, "r_y2": 692.559, "r_x3": 50.112, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "fine-tuned to mimic the appearance of the original datasets", "orig": "fine-tuned to mimic the appearance of the original datasets", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 74, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 713.066, "r_x1": 286.365, "r_y1": 713.066, "r_x2": 286.365, "r_y2": 704.514, "r_x3": 50.112, "r_y3": 704.514, "coord_origin": "TOPLEFT"}, "text": "but encompass more complicated table structures. The third", "orig": "but encompass more complicated table structures. The third", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "In this regard, we have prepared four synthetic datasets, each one containing 150k examples. The corpora to generate the table text consists of the most frequent terms appearing in PubTabNet and FinTabNet together with randomly generated text. The first two synthetic datasets have been fine-tuned to mimic the appearance of the original datasets but encompass more complicated table structures. The third"}, {"label": "table", "id": 8, "page_no": 3, "cluster": {"id": 8, "label": "table", "bbox": {"l": 310.67584228515625, "t": 73.19388580322266, "r": 542.9547119140625, "b": 155.22052001953125, "coord_origin": "TOPLEFT"}, "confidence": 0.9777463674545288, "cells": [{"index": 75, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 412.332, "r_y0": 82.43499999999995, "r_x1": 430.902, "r_y1": 82.43499999999995, "r_x2": 430.902, "r_y2": 73.88300000000004, "r_x3": 412.332, "r_y3": 73.88300000000004, "coord_origin": "TOPLEFT"}, "text": "Tags", "orig": "Tags", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 76, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 442.857, "r_y0": 82.43499999999995, "r_x1": 464.446, "r_y1": 82.43499999999995, "r_x2": 464.446, "r_y2": 73.88300000000004, "r_x3": 442.857, "r_y3": 73.88300000000004, "coord_origin": "TOPLEFT"}, "text": "Bbox", "orig": "Bbox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 77, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 477.786, "r_y0": 82.43499999999995, "r_x1": 494.942, "r_y1": 82.43499999999995, "r_x2": 494.942, "r_y2": 73.88300000000004, "r_x3": 477.786, "r_y3": 73.88300000000004, "coord_origin": "TOPLEFT"}, "text": "Size", "orig": "Size", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 78, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 508.282, "r_y0": 82.43499999999995, "r_x1": 536.914, "r_y1": 82.43499999999995, "r_x2": 536.914, "r_y2": 73.88300000000004, "r_x3": 508.282, "r_y3": 73.88300000000004, "coord_origin": "TOPLEFT"}, "text": "Format", "orig": "Format", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 79, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 317.06, "r_y0": 94.78800000000001, "r_x1": 361.643, "r_y1": 94.78800000000001, "r_x2": 361.643, "r_y2": 86.23599999999999, "r_x3": 317.06, "r_y3": 86.23599999999999, "coord_origin": "TOPLEFT"}, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 80, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 417.856, "r_y0": 92.72199999999998, "r_x1": 425.378, "r_y1": 92.72199999999998, "r_x2": 425.378, "r_y2": 85.668, "r_x3": 417.856, "r_y3": 85.668, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 81, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 449.896, "r_y0": 92.72199999999998, "r_x1": 457.417, "r_y1": 92.72199999999998, "r_x2": 457.417, "r_y2": 85.668, "r_x3": 449.896, "r_y3": 85.668, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 82, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 476.401, "r_y0": 94.78800000000001, "r_x1": 496.326, "r_y1": 94.78800000000001, "r_x2": 496.326, "r_y2": 86.23599999999999, "r_x3": 476.401, "r_y3": 86.23599999999999, "coord_origin": "TOPLEFT"}, "text": "509k", "orig": "509k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 83, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 512.635, "r_y0": 94.78800000000001, "r_x1": 532.56, "r_y1": 94.78800000000001, "r_x2": 532.56, "r_y2": 86.23599999999999, "r_x3": 512.635, "r_y3": 86.23599999999999, "coord_origin": "TOPLEFT"}, "text": "PNG", "orig": "PNG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 84, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 317.06, "r_y0": 106.74300000000005, "r_x1": 359.431, "r_y1": 106.74300000000005, "r_x2": 359.431, "r_y2": 98.19100000000003, "r_x3": 317.06, "r_y3": 98.19100000000003, "coord_origin": "TOPLEFT"}, "text": "FinTabNet", "orig": "FinTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 85, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 417.856, "r_y0": 104.67700000000002, "r_x1": 425.378, "r_y1": 104.67700000000002, "r_x2": 425.378, "r_y2": 97.62300000000005, "r_x3": 417.856, "r_y3": 97.62300000000005, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 86, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 449.896, "r_y0": 104.67700000000002, "r_x1": 457.417, "r_y1": 104.67700000000002, "r_x2": 457.417, "r_y2": 97.62300000000005, "r_x3": 449.896, "r_y3": 97.62300000000005, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 87, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 476.401, "r_y0": 106.74300000000005, "r_x1": 496.326, "r_y1": 106.74300000000005, "r_x2": 496.326, "r_y2": 98.19100000000003, "r_x3": 476.401, "r_y3": 98.19100000000003, "coord_origin": "TOPLEFT"}, "text": "112k", "orig": "112k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 88, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 513.462, "r_y0": 106.74300000000005, "r_x1": 531.733, "r_y1": 106.74300000000005, "r_x2": 531.733, "r_y2": 98.19100000000003, "r_x3": 513.462, "r_y3": 98.19100000000003, "coord_origin": "TOPLEFT"}, "text": "PDF", "orig": "PDF", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 89, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 317.06, "r_y0": 118.69899999999996, "r_x1": 359.979, "r_y1": 118.69899999999996, "r_x2": 359.979, "r_y2": 110.14700000000005, "r_x3": 317.06, "r_y3": 110.14700000000005, "coord_origin": "TOPLEFT"}, "text": "TableBank", "orig": "TableBank", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 90, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 417.856, "r_y0": 116.63300000000004, "r_x1": 425.378, "r_y1": 116.63300000000004, "r_x2": 425.378, "r_y2": 109.57899999999995, "r_x3": 417.856, "r_y3": 109.57899999999995, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 91, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 450.812, "r_y0": 116.63300000000004, "r_x1": 456.501, "r_y1": 116.63300000000004, "r_x2": 456.501, "r_y2": 109.57899999999995, "r_x3": 450.812, "r_y3": 109.57899999999995, "coord_origin": "TOPLEFT"}, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 92, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 476.401, "r_y0": 118.69899999999996, "r_x1": 496.326, "r_y1": 118.69899999999996, "r_x2": 496.326, "r_y2": 110.14700000000005, "r_x3": 476.401, "r_y3": 110.14700000000005, "coord_origin": "TOPLEFT"}, "text": "145k", "orig": "145k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 93, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 511.25, "r_y0": 118.69899999999996, "r_x1": 533.945, "r_y1": 118.69899999999996, "r_x2": 533.945, "r_y2": 110.14700000000005, "r_x3": 511.25, "r_y3": 110.14700000000005, "coord_origin": "TOPLEFT"}, "text": "JPEG", "orig": "JPEG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 94, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 317.06, "r_y0": 130.654, "r_x1": 400.377, "r_y1": 130.654, "r_x2": 400.377, "r_y2": 122.10199999999998, "r_x3": 317.06, "r_y3": 122.10199999999998, "coord_origin": "TOPLEFT"}, "text": "Combined-Tabnet(*)", "orig": "Combined-Tabnet(*)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 95, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 417.856, "r_y0": 128.58799999999997, "r_x1": 425.378, "r_y1": 128.58799999999997, "r_x2": 425.378, "r_y2": 121.53399999999999, "r_x3": 417.856, "r_y3": 121.53399999999999, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 96, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 449.896, "r_y0": 128.58799999999997, "r_x1": 457.417, "r_y1": 128.58799999999997, "r_x2": 457.417, "r_y2": 121.53399999999999, "r_x3": 449.896, "r_y3": 121.53399999999999, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 97, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 476.401, "r_y0": 130.654, "r_x1": 496.326, "r_y1": 130.654, "r_x2": 496.326, "r_y2": 122.10199999999998, "r_x3": 476.401, "r_y3": 122.10199999999998, "coord_origin": "TOPLEFT"}, "text": "400k", "orig": "400k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 98, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 512.635, "r_y0": 130.654, "r_x1": 532.56, "r_y1": 130.654, "r_x2": 532.56, "r_y2": 122.10199999999998, "r_x3": 512.635, "r_y3": 122.10199999999998, "coord_origin": "TOPLEFT"}, "text": "PNG", "orig": "PNG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 99, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 317.06, "r_y0": 142.60900000000004, "r_x1": 375.172, "r_y1": 142.60900000000004, "r_x2": 375.172, "r_y2": 134.05700000000002, "r_x3": 317.06, "r_y3": 134.05700000000002, "coord_origin": "TOPLEFT"}, "text": "Combined(**)", "orig": "Combined(**)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 100, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 417.856, "r_y0": 140.543, "r_x1": 425.378, "r_y1": 140.543, "r_x2": 425.378, "r_y2": 133.48900000000003, "r_x3": 417.856, "r_y3": 133.48900000000003, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 101, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 449.896, "r_y0": 140.543, "r_x1": 457.417, "r_y1": 140.543, "r_x2": 457.417, "r_y2": 133.48900000000003, "r_x3": 449.896, "r_y3": 133.48900000000003, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 102, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 476.401, "r_y0": 142.60900000000004, "r_x1": 496.326, "r_y1": 142.60900000000004, "r_x2": 496.326, "r_y2": 134.05700000000002, "r_x3": 476.401, "r_y3": 134.05700000000002, "coord_origin": "TOPLEFT"}, "text": "500k", "orig": "500k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 103, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 512.635, "r_y0": 142.60900000000004, "r_x1": 532.56, "r_y1": 142.60900000000004, "r_x2": 532.56, "r_y2": 134.05700000000002, "r_x3": 512.635, "r_y3": 134.05700000000002, "coord_origin": "TOPLEFT"}, "text": "PNG", "orig": "PNG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 104, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 317.06, "r_y0": 154.56399999999996, "r_x1": 369.394, "r_y1": 154.56399999999996, "r_x2": 369.394, "r_y2": 146.01199999999994, "r_x3": 317.06, "r_y3": 146.01199999999994, "coord_origin": "TOPLEFT"}, "text": "SynthTabNet", "orig": "SynthTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 105, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 417.856, "r_y0": 152.49800000000005, "r_x1": 425.378, "r_y1": 152.49800000000005, "r_x2": 425.378, "r_y2": 145.44399999999996, "r_x3": 417.856, "r_y3": 145.44399999999996, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 106, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 449.896, "r_y0": 152.49800000000005, "r_x1": 457.417, "r_y1": 152.49800000000005, "r_x2": 457.417, "r_y2": 145.44399999999996, "r_x3": 449.896, "r_y3": 145.44399999999996, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 107, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 476.401, "r_y0": 154.56399999999996, "r_x1": 496.326, "r_y1": 154.56399999999996, "r_x2": 496.326, "r_y2": 146.01199999999994, "r_x3": 476.401, "r_y3": 146.01199999999994, "coord_origin": "TOPLEFT"}, "text": "600k", "orig": "600k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 108, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 512.635, "r_y0": 154.56399999999996, "r_x1": 532.56, "r_y1": 154.56399999999996, "r_x2": 532.56, "r_y2": 146.01199999999994, "r_x3": 512.635, "r_y3": 146.01199999999994, "coord_origin": "TOPLEFT"}, "text": "PNG", "orig": "PNG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": [{"id": 17, "label": "text", "bbox": {"l": 412.332, "t": 73.88300000000004, "r": 430.902, "b": 82.43499999999995, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 75, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 412.332, "r_y0": 82.43499999999995, "r_x1": 430.902, "r_y1": 82.43499999999995, "r_x2": 430.902, "r_y2": 73.88300000000004, "r_x3": 412.332, "r_y3": 73.88300000000004, "coord_origin": "TOPLEFT"}, "text": "Tags", "orig": "Tags", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 18, "label": "text", "bbox": {"l": 442.857, "t": 73.88300000000004, "r": 464.446, "b": 82.43499999999995, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 76, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 442.857, "r_y0": 82.43499999999995, "r_x1": 464.446, "r_y1": 82.43499999999995, "r_x2": 464.446, "r_y2": 73.88300000000004, "r_x3": 442.857, "r_y3": 73.88300000000004, "coord_origin": "TOPLEFT"}, "text": "Bbox", "orig": "Bbox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 19, "label": "text", "bbox": {"l": 477.786, "t": 73.88300000000004, "r": 494.942, "b": 82.43499999999995, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 77, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 477.786, "r_y0": 82.43499999999995, "r_x1": 494.942, "r_y1": 82.43499999999995, "r_x2": 494.942, "r_y2": 73.88300000000004, "r_x3": 477.786, "r_y3": 73.88300000000004, "coord_origin": "TOPLEFT"}, "text": "Size", "orig": "Size", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 20, "label": "text", "bbox": {"l": 508.282, "t": 73.88300000000004, "r": 536.914, "b": 82.43499999999995, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 78, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 508.282, "r_y0": 82.43499999999995, "r_x1": 536.914, "r_y1": 82.43499999999995, "r_x2": 536.914, "r_y2": 73.88300000000004, "r_x3": 508.282, "r_y3": 73.88300000000004, "coord_origin": "TOPLEFT"}, "text": "Format", "orig": "Format", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 21, "label": "text", "bbox": {"l": 317.06, "t": 86.23599999999999, "r": 361.643, "b": 94.78800000000001, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 79, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 317.06, "r_y0": 94.78800000000001, "r_x1": 361.643, "r_y1": 94.78800000000001, "r_x2": 361.643, "r_y2": 86.23599999999999, "r_x3": 317.06, "r_y3": 86.23599999999999, "coord_origin": "TOPLEFT"}, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 22, "label": "text", "bbox": {"l": 417.856, "t": 85.668, "r": 425.378, "b": 92.72199999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 80, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 417.856, "r_y0": 92.72199999999998, "r_x1": 425.378, "r_y1": 92.72199999999998, "r_x2": 425.378, "r_y2": 85.668, "r_x3": 417.856, "r_y3": 85.668, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 23, "label": "text", "bbox": {"l": 449.896, "t": 85.668, "r": 457.417, "b": 92.72199999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 81, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 449.896, "r_y0": 92.72199999999998, "r_x1": 457.417, "r_y1": 92.72199999999998, "r_x2": 457.417, "r_y2": 85.668, "r_x3": 449.896, "r_y3": 85.668, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 24, "label": "text", "bbox": {"l": 476.401, "t": 86.23599999999999, "r": 496.326, "b": 94.78800000000001, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 82, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 476.401, "r_y0": 94.78800000000001, "r_x1": 496.326, "r_y1": 94.78800000000001, "r_x2": 496.326, "r_y2": 86.23599999999999, "r_x3": 476.401, "r_y3": 86.23599999999999, "coord_origin": "TOPLEFT"}, "text": "509k", "orig": "509k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 25, "label": "text", "bbox": {"l": 512.635, "t": 86.23599999999999, "r": 532.56, "b": 94.78800000000001, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 83, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 512.635, "r_y0": 94.78800000000001, "r_x1": 532.56, "r_y1": 94.78800000000001, "r_x2": 532.56, "r_y2": 86.23599999999999, "r_x3": 512.635, "r_y3": 86.23599999999999, "coord_origin": "TOPLEFT"}, "text": "PNG", "orig": "PNG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 26, "label": "text", "bbox": {"l": 317.06, "t": 98.19100000000003, "r": 359.431, "b": 106.74300000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 84, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 317.06, "r_y0": 106.74300000000005, "r_x1": 359.431, "r_y1": 106.74300000000005, "r_x2": 359.431, "r_y2": 98.19100000000003, "r_x3": 317.06, "r_y3": 98.19100000000003, "coord_origin": "TOPLEFT"}, "text": "FinTabNet", "orig": "FinTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 27, "label": "text", "bbox": {"l": 417.856, "t": 97.62300000000005, "r": 425.378, "b": 104.67700000000002, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 85, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 417.856, "r_y0": 104.67700000000002, "r_x1": 425.378, "r_y1": 104.67700000000002, "r_x2": 425.378, "r_y2": 97.62300000000005, "r_x3": 417.856, "r_y3": 97.62300000000005, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 28, "label": "text", "bbox": {"l": 449.896, "t": 97.62300000000005, "r": 457.417, "b": 104.67700000000002, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 86, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 449.896, "r_y0": 104.67700000000002, "r_x1": 457.417, "r_y1": 104.67700000000002, "r_x2": 457.417, "r_y2": 97.62300000000005, "r_x3": 449.896, "r_y3": 97.62300000000005, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 29, "label": "text", "bbox": {"l": 476.401, "t": 98.19100000000003, "r": 496.326, "b": 106.74300000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 87, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 476.401, "r_y0": 106.74300000000005, "r_x1": 496.326, "r_y1": 106.74300000000005, "r_x2": 496.326, "r_y2": 98.19100000000003, "r_x3": 476.401, "r_y3": 98.19100000000003, "coord_origin": "TOPLEFT"}, "text": "112k", "orig": "112k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 30, "label": "text", "bbox": {"l": 513.462, "t": 98.19100000000003, "r": 531.733, "b": 106.74300000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 88, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 513.462, "r_y0": 106.74300000000005, "r_x1": 531.733, "r_y1": 106.74300000000005, "r_x2": 531.733, "r_y2": 98.19100000000003, "r_x3": 513.462, "r_y3": 98.19100000000003, "coord_origin": "TOPLEFT"}, "text": "PDF", "orig": "PDF", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 31, "label": "text", "bbox": {"l": 317.06, "t": 110.14700000000005, "r": 359.979, "b": 118.69899999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 89, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 317.06, "r_y0": 118.69899999999996, "r_x1": 359.979, "r_y1": 118.69899999999996, "r_x2": 359.979, "r_y2": 110.14700000000005, "r_x3": 317.06, "r_y3": 110.14700000000005, "coord_origin": "TOPLEFT"}, "text": "TableBank", "orig": "TableBank", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 32, "label": "text", "bbox": {"l": 417.856, "t": 109.57899999999995, "r": 425.378, "b": 116.63300000000004, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 90, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 417.856, "r_y0": 116.63300000000004, "r_x1": 425.378, "r_y1": 116.63300000000004, "r_x2": 425.378, "r_y2": 109.57899999999995, "r_x3": 417.856, "r_y3": 109.57899999999995, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 33, "label": "text", "bbox": {"l": 450.812, "t": 109.57899999999995, "r": 456.501, "b": 116.63300000000004, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 91, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 450.812, "r_y0": 116.63300000000004, "r_x1": 456.501, "r_y1": 116.63300000000004, "r_x2": 456.501, "r_y2": 109.57899999999995, "r_x3": 450.812, "r_y3": 109.57899999999995, "coord_origin": "TOPLEFT"}, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 34, "label": "text", "bbox": {"l": 476.401, "t": 110.14700000000005, "r": 496.326, "b": 118.69899999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 92, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 476.401, "r_y0": 118.69899999999996, "r_x1": 496.326, "r_y1": 118.69899999999996, "r_x2": 496.326, "r_y2": 110.14700000000005, "r_x3": 476.401, "r_y3": 110.14700000000005, "coord_origin": "TOPLEFT"}, "text": "145k", "orig": "145k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 35, "label": "text", "bbox": {"l": 511.25, "t": 110.14700000000005, "r": 533.945, "b": 118.69899999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 93, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 511.25, "r_y0": 118.69899999999996, "r_x1": 533.945, "r_y1": 118.69899999999996, "r_x2": 533.945, "r_y2": 110.14700000000005, "r_x3": 511.25, "r_y3": 110.14700000000005, "coord_origin": "TOPLEFT"}, "text": "JPEG", "orig": "JPEG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 36, "label": "text", "bbox": {"l": 317.06, "t": 122.10199999999998, "r": 400.377, "b": 130.654, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 94, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 317.06, "r_y0": 130.654, "r_x1": 400.377, "r_y1": 130.654, "r_x2": 400.377, "r_y2": 122.10199999999998, "r_x3": 317.06, "r_y3": 122.10199999999998, "coord_origin": "TOPLEFT"}, "text": "Combined-Tabnet(*)", "orig": "Combined-Tabnet(*)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 37, "label": "text", "bbox": {"l": 417.856, "t": 121.53399999999999, "r": 425.378, "b": 128.58799999999997, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 95, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 417.856, "r_y0": 128.58799999999997, "r_x1": 425.378, "r_y1": 128.58799999999997, "r_x2": 425.378, "r_y2": 121.53399999999999, "r_x3": 417.856, "r_y3": 121.53399999999999, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 38, "label": "text", "bbox": {"l": 449.896, "t": 121.53399999999999, "r": 457.417, "b": 128.58799999999997, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 96, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 449.896, "r_y0": 128.58799999999997, "r_x1": 457.417, "r_y1": 128.58799999999997, "r_x2": 457.417, "r_y2": 121.53399999999999, "r_x3": 449.896, "r_y3": 121.53399999999999, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 39, "label": "text", "bbox": {"l": 476.401, "t": 122.10199999999998, "r": 496.326, "b": 130.654, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 97, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 476.401, "r_y0": 130.654, "r_x1": 496.326, "r_y1": 130.654, "r_x2": 496.326, "r_y2": 122.10199999999998, "r_x3": 476.401, "r_y3": 122.10199999999998, "coord_origin": "TOPLEFT"}, "text": "400k", "orig": "400k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 40, "label": "text", "bbox": {"l": 512.635, "t": 122.10199999999998, "r": 532.56, "b": 130.654, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 98, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 512.635, "r_y0": 130.654, "r_x1": 532.56, "r_y1": 130.654, "r_x2": 532.56, "r_y2": 122.10199999999998, "r_x3": 512.635, "r_y3": 122.10199999999998, "coord_origin": "TOPLEFT"}, "text": "PNG", "orig": "PNG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 41, "label": "text", "bbox": {"l": 317.06, "t": 134.05700000000002, "r": 375.172, "b": 142.60900000000004, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 99, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 317.06, "r_y0": 142.60900000000004, "r_x1": 375.172, "r_y1": 142.60900000000004, "r_x2": 375.172, "r_y2": 134.05700000000002, "r_x3": 317.06, "r_y3": 134.05700000000002, "coord_origin": "TOPLEFT"}, "text": "Combined(**)", "orig": "Combined(**)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 42, "label": "text", "bbox": {"l": 417.856, "t": 133.48900000000003, "r": 425.378, "b": 140.543, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 100, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 417.856, "r_y0": 140.543, "r_x1": 425.378, "r_y1": 140.543, "r_x2": 425.378, "r_y2": 133.48900000000003, "r_x3": 417.856, "r_y3": 133.48900000000003, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 43, "label": "text", "bbox": {"l": 449.896, "t": 133.48900000000003, "r": 457.417, "b": 140.543, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 101, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 449.896, "r_y0": 140.543, "r_x1": 457.417, "r_y1": 140.543, "r_x2": 457.417, "r_y2": 133.48900000000003, "r_x3": 449.896, "r_y3": 133.48900000000003, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 44, "label": "text", "bbox": {"l": 476.401, "t": 134.05700000000002, "r": 496.326, "b": 142.60900000000004, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 102, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 476.401, "r_y0": 142.60900000000004, "r_x1": 496.326, "r_y1": 142.60900000000004, "r_x2": 496.326, "r_y2": 134.05700000000002, "r_x3": 476.401, "r_y3": 134.05700000000002, "coord_origin": "TOPLEFT"}, "text": "500k", "orig": "500k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 45, "label": "text", "bbox": {"l": 512.635, "t": 134.05700000000002, "r": 532.56, "b": 142.60900000000004, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 103, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 512.635, "r_y0": 142.60900000000004, "r_x1": 532.56, "r_y1": 142.60900000000004, "r_x2": 532.56, "r_y2": 134.05700000000002, "r_x3": 512.635, "r_y3": 134.05700000000002, "coord_origin": "TOPLEFT"}, "text": "PNG", "orig": "PNG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 46, "label": "text", "bbox": {"l": 317.06, "t": 146.01199999999994, "r": 369.394, "b": 154.56399999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 104, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 317.06, "r_y0": 154.56399999999996, "r_x1": 369.394, "r_y1": 154.56399999999996, "r_x2": 369.394, "r_y2": 146.01199999999994, "r_x3": 317.06, "r_y3": 146.01199999999994, "coord_origin": "TOPLEFT"}, "text": "SynthTabNet", "orig": "SynthTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 47, "label": "text", "bbox": {"l": 417.856, "t": 145.44399999999996, "r": 425.378, "b": 152.49800000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 105, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 417.856, "r_y0": 152.49800000000005, "r_x1": 425.378, "r_y1": 152.49800000000005, "r_x2": 425.378, "r_y2": 145.44399999999996, "r_x3": 417.856, "r_y3": 145.44399999999996, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 48, "label": "text", "bbox": {"l": 449.896, "t": 145.44399999999996, "r": 457.417, "b": 152.49800000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 106, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 449.896, "r_y0": 152.49800000000005, "r_x1": 457.417, "r_y1": 152.49800000000005, "r_x2": 457.417, "r_y2": 145.44399999999996, "r_x3": 449.896, "r_y3": 145.44399999999996, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 49, "label": "text", "bbox": {"l": 476.401, "t": 146.01199999999994, "r": 496.326, "b": 154.56399999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 107, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 476.401, "r_y0": 154.56399999999996, "r_x1": 496.326, "r_y1": 154.56399999999996, "r_x2": 496.326, "r_y2": 146.01199999999994, "r_x3": 476.401, "r_y3": 146.01199999999994, "coord_origin": "TOPLEFT"}, "text": "600k", "orig": "600k", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 50, "label": "text", "bbox": {"l": 512.635, "t": 146.01199999999994, "r": 532.56, "b": 154.56399999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 108, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 512.635, "r_y0": 154.56399999999996, "r_x1": 532.56, "r_y1": 154.56399999999996, "r_x2": 532.56, "r_y2": 146.01199999999994, "r_x3": 512.635, "r_y3": 146.01199999999994, "coord_origin": "TOPLEFT"}, "text": "PNG", "orig": "PNG", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}]}, "text": null, "otsl_seq": ["ecel", "ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 7, "num_cols": 5, "table_cells": [{"bbox": {"l": 412.332, "t": 73.88300000000004, "r": 430.902, "b": 82.43499999999995, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "Tags", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 442.857, "t": 73.88300000000004, "r": 464.446, "b": 82.43499999999995, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "Bbox", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 477.786, "t": 73.88300000000004, "r": 494.942, "b": 82.43499999999995, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "Size", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 508.282, "t": 73.88300000000004, "r": 536.914, "b": 82.43499999999995, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "Format", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 317.06, "t": 86.23599999999999, "r": 361.643, "b": 94.78800000000001, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "PubTabNet", "column_header": false, "row_header": true, "row_section": false}, {"bbox": {"l": 417.856, "t": 85.668, "r": 425.378, "b": 92.72199999999998, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "3", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 449.896, "t": 85.668, "r": 457.417, "b": 92.72199999999998, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "3", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 476.401, "t": 86.23599999999999, "r": 496.326, "b": 94.78800000000001, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "509k", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 512.635, "t": 86.23599999999999, "r": 532.56, "b": 94.78800000000001, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "PNG", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 317.06, "t": 98.19100000000003, "r": 359.431, "b": 106.74300000000005, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "FinTabNet", "column_header": false, "row_header": true, "row_section": false}, {"bbox": {"l": 417.856, "t": 97.62300000000005, "r": 425.378, "b": 104.67700000000002, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "3", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 449.896, "t": 97.62300000000005, "r": 457.417, "b": 104.67700000000002, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "3", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 476.401, "t": 98.19100000000003, "r": 496.326, "b": 106.74300000000005, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "112k", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 513.462, "t": 98.19100000000003, "r": 531.733, "b": 106.74300000000005, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "PDF", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 317.06, "t": 110.14700000000005, "r": 359.979, "b": 118.69899999999996, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "TableBank", "column_header": false, "row_header": true, "row_section": false}, {"bbox": {"l": 417.856, "t": 109.57899999999995, "r": 425.378, "b": 116.63300000000004, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "3", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 450.812, "t": 109.57899999999995, "r": 456.501, "b": 116.63300000000004, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "7", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 476.401, "t": 110.14700000000005, "r": 496.326, "b": 118.69899999999996, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "145k", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 511.25, "t": 110.14700000000005, "r": 533.945, "b": 118.69899999999996, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "JPEG", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 317.06, "t": 122.10199999999998, "r": 400.377, "b": 130.654, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Combined-Tabnet(*)", "column_header": false, "row_header": true, "row_section": false}, {"bbox": {"l": 417.856, "t": 121.53399999999999, "r": 425.378, "b": 128.58799999999997, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "3", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 449.896, "t": 121.53399999999999, "r": 457.417, "b": 128.58799999999997, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "3", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 476.401, "t": 122.10199999999998, "r": 496.326, "b": 130.654, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "400k", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 512.635, "t": 122.10199999999998, "r": 532.56, "b": 130.654, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "PNG", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 317.06, "t": 134.05700000000002, "r": 375.172, "b": 142.60900000000004, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Combined(**)", "column_header": false, "row_header": true, "row_section": false}, {"bbox": {"l": 417.856, "t": 133.48900000000003, "r": 425.378, "b": 140.543, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "3", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 449.896, "t": 133.48900000000003, "r": 457.417, "b": 140.543, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "3", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 476.401, "t": 134.05700000000002, "r": 496.326, "b": 142.60900000000004, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "500k", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 512.635, "t": 134.05700000000002, "r": 532.56, "b": 142.60900000000004, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "PNG", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 317.06, "t": 146.01199999999994, "r": 369.394, "b": 154.56399999999996, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "SynthTabNet", "column_header": false, "row_header": true, "row_section": false}, {"bbox": {"l": 417.856, "t": 145.44399999999996, "r": 425.378, "b": 152.49800000000005, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "3", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 449.896, "t": 145.44399999999996, "r": 457.417, "b": 152.49800000000005, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "3", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 476.401, "t": 146.01199999999994, "r": 496.326, "b": 154.56399999999996, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "600k", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 512.635, "t": 146.01199999999994, "r": 532.56, "b": 154.56399999999996, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "PNG", "column_header": false, "row_header": false, "row_section": false}]}, {"label": "caption", "id": 9, "page_no": 3, "cluster": {"id": 9, "label": "caption", "bbox": {"l": 308.862, "t": 167.75099999999998, "r": 545.115, "b": 224.303, "coord_origin": "TOPLEFT"}, "confidence": 0.9667726755142212, "cells": [{"index": 109, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 176.48199999999997, "r_x1": 330.75, "r_y1": 176.48199999999997, "r_x2": 330.75, "r_y2": 167.92999999999995, "r_x3": 308.862, "r_y3": 167.92999999999995, "coord_origin": "TOPLEFT"}, "text": "Table", "orig": "Table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 110, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 336.867, "r_y0": 176.48199999999997, "r_x1": 344.618, "r_y1": 176.48199999999997, "r_x2": 344.618, "r_y2": 167.92999999999995, "r_x3": 336.867, "r_y3": 167.92999999999995, "coord_origin": "TOPLEFT"}, "text": "1:", "orig": "1:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 111, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 361.076, "r_y0": 176.48199999999997, "r_x1": 380.453, "r_y1": 176.48199999999997, "r_x2": 380.453, "r_y2": 167.92999999999995, "r_x3": 361.076, "r_y3": 167.92999999999995, "coord_origin": "TOPLEFT"}, "text": "Both", "orig": "Both", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 112, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 386.568, "r_y0": 176.33900000000006, "r_x1": 468.68, "r_y1": 176.33900000000006, "r_x2": 468.68, "r_y2": 167.75099999999998, "r_x3": 386.568, "r_y3": 167.75099999999998, "coord_origin": "TOPLEFT"}, "text": "'Combined-Tabnet'", "orig": "'Combined-Tabnet'", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 113, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 474.796, "r_y0": 176.48199999999997, "r_x1": 489.182, "r_y1": 176.48199999999997, "r_x2": 489.182, "r_y2": 167.92999999999995, "r_x3": 474.796, "r_y3": 167.92999999999995, "coord_origin": "TOPLEFT"}, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 114, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 495.299, "r_y0": 176.33900000000006, "r_x1": 545.112, "r_y1": 176.33900000000006, "r_x2": 545.112, "r_y2": 167.75099999999998, "r_x3": 495.299, "r_y3": 167.75099999999998, "coord_origin": "TOPLEFT"}, "text": "'Combined-", "orig": "'Combined-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 115, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 188.29399999999998, "r_x1": 341.161, "r_y1": 188.29399999999998, "r_x2": 341.161, "r_y2": 179.70600000000002, "r_x3": 308.862, "r_y3": 179.70600000000002, "coord_origin": "TOPLEFT"}, "text": "Tabnet'", "orig": "Tabnet'", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 116, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 343.457, "r_y0": 188.437, "r_x1": 545.11, "r_y1": 188.437, "r_x2": 545.11, "r_y2": 179.885, "r_x3": 343.457, "r_y3": 179.885, "coord_origin": "TOPLEFT"}, "text": "are variations of the following: (*) The Combined-", "orig": "are variations of the following: (*) The Combined-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 117, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 200.39200000000005, "r_x1": 545.115, "r_y1": 200.39200000000005, "r_x2": 545.115, "r_y2": 191.84000000000003, "r_x3": 308.862, "r_y3": 191.84000000000003, "coord_origin": "TOPLEFT"}, "text": "Tabnet dataset is the processed combination of PubTabNet", "orig": "Tabnet dataset is the processed combination of PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 118, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 212.34699999999998, "r_x1": 366.276, "r_y1": 212.34699999999998, "r_x2": 366.276, "r_y2": 203.79499999999996, "r_x3": 308.862, "r_y3": 203.79499999999996, "coord_origin": "TOPLEFT"}, "text": "and Fintabnet.", "orig": "and Fintabnet.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 119, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 370.58, "r_y0": 212.34699999999998, "r_x1": 545.115, "r_y1": 212.34699999999998, "r_x2": 545.115, "r_y2": 203.79499999999996, "r_x3": 370.58, "r_y3": 203.79499999999996, "coord_origin": "TOPLEFT"}, "text": "(**) The combined dataset is the processed", "orig": "(**) The combined dataset is the processed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 120, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 224.303, "r_x1": 523.935, "r_y1": 224.303, "r_x2": 523.935, "r_y2": 215.75099999999998, "r_x3": 308.862, "r_y3": 215.75099999999998, "coord_origin": "TOPLEFT"}, "text": "combination of PubTabNet, Fintabnet and TableBank.", "orig": "combination of PubTabNet, Fintabnet and TableBank.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Table 1: Both 'Combined-Tabnet' and 'CombinedTabnet' are variations of the following: (*) The CombinedTabnet dataset is the processed combination of PubTabNet and Fintabnet. (**) The combined dataset is the processed combination of PubTabNet, Fintabnet and TableBank."}, {"label": "text", "id": 6, "page_no": 3, "cluster": {"id": 6, "label": "text", "bbox": {"l": 308.862, "t": 249.889, "r": 545.115, "b": 294.306, "coord_origin": "TOPLEFT"}, "confidence": 0.978954017162323, "cells": [{"index": 121, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 258.44100000000003, "r_x1": 545.115, "r_y1": 258.44100000000003, "r_x2": 545.115, "r_y2": 249.889, "r_x3": 308.862, "r_y3": 249.889, "coord_origin": "TOPLEFT"}, "text": "one adopts a colorful appearance with high contrast and the", "orig": "one adopts a colorful appearance with high contrast and the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 122, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 270.39599999999996, "r_x1": 545.115, "r_y1": 270.39599999999996, "r_x2": 545.115, "r_y2": 261.84400000000005, "r_x3": 308.862, "r_y3": 261.84400000000005, "coord_origin": "TOPLEFT"}, "text": "last one contains tables with sparse content. Lastly, we have", "orig": "last one contains tables with sparse content. Lastly, we have", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 123, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 282.351, "r_x1": 545.115, "r_y1": 282.351, "r_x2": 545.115, "r_y2": 273.799, "r_x3": 308.862, "r_y3": 273.799, "coord_origin": "TOPLEFT"}, "text": "combined all synthetic datasets into one big unified syn-", "orig": "combined all synthetic datasets into one big unified syn-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 124, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 294.306, "r_x1": 436.822, "r_y1": 294.306, "r_x2": 436.822, "r_y2": 285.754, "r_x3": 308.862, "r_y3": 285.754, "coord_origin": "TOPLEFT"}, "text": "thetic dataset of 600k examples.", "orig": "thetic dataset of 600k examples.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "one adopts a colorful appearance with high contrast and the last one contains tables with sparse content. Lastly, we have combined all synthetic datasets into one big unified synthetic dataset of 600k examples."}, {"label": "text", "id": 13, "page_no": 3, "cluster": {"id": 13, "label": "text", "bbox": {"l": 320.817, "t": 298.041, "r": 542.744, "b": 306.593, "coord_origin": "TOPLEFT"}, "confidence": 0.9043695330619812, "cells": [{"index": 125, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 306.593, "r_x1": 542.744, "r_y1": 306.593, "r_x2": 542.744, "r_y2": 298.041, "r_x3": 320.817, "r_y3": 298.041, "coord_origin": "TOPLEFT"}, "text": "Tab. 1 summarizes the various attributes of the datasets.", "orig": "Tab. 1 summarizes the various attributes of the datasets.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Tab. 1 summarizes the various attributes of the datasets."}, {"label": "section_header", "id": 11, "page_no": 3, "cluster": {"id": 11, "label": "section_header", "bbox": {"l": 308.862, "t": 321.184, "r": 444.936, "b": 331.932, "coord_origin": "TOPLEFT"}, "confidence": 0.9466595649719238, "cells": [{"index": 126, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 331.932, "r_x1": 444.936, "r_y1": 331.932, "r_x2": 444.936, "r_y2": 321.184, "r_x3": 308.862, "r_y3": 321.184, "coord_origin": "TOPLEFT"}, "text": "4. The TableFormer model", "orig": "4. The TableFormer model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "4. The TableFormer model"}, {"label": "text", "id": 0, "page_no": 3, "cluster": {"id": 0, "label": "text", "bbox": {"l": 308.862, "t": 342.208, "r": 545.115, "b": 446.401, "coord_origin": "TOPLEFT"}, "confidence": 0.9884450435638428, "cells": [{"index": 127, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 350.76, "r_x1": 545.115, "r_y1": 350.76, "r_x2": 545.115, "r_y2": 342.208, "r_x3": 320.817, "r_y3": 342.208, "coord_origin": "TOPLEFT"}, "text": "Given the image of a table, TableFormer is able to pre-", "orig": "Given the image of a table, TableFormer is able to pre-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 128, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 362.715, "r_x1": 326.576, "r_y1": 362.715, "r_x2": 326.576, "r_y2": 354.163, "r_x3": 308.862, "r_y3": 354.163, "coord_origin": "TOPLEFT"}, "text": "dict:", "orig": "dict:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 129, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 330.172, "r_y0": 362.715, "r_x1": 545.115, "r_y1": 362.715, "r_x2": 545.115, "r_y2": 354.163, "r_x3": 330.172, "r_y3": 354.163, "coord_origin": "TOPLEFT"}, "text": "1) a sequence of tokens that represent the structure of", "orig": "1) a sequence of tokens that represent the structure of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 130, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 374.67, "r_x1": 545.115, "r_y1": 374.67, "r_x2": 545.115, "r_y2": 366.118, "r_x3": 308.862, "r_y3": 366.118, "coord_origin": "TOPLEFT"}, "text": "a table, and 2) a bounding box coupled to a subset of those", "orig": "a table, and 2) a bounding box coupled to a subset of those", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 131, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 386.625, "r_x1": 337.265, "r_y1": 386.625, "r_x2": 337.265, "r_y2": 378.073, "r_x3": 308.862, "r_y3": 378.073, "coord_origin": "TOPLEFT"}, "text": "tokens.", "orig": "tokens.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 132, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 341.808, "r_y0": 386.625, "r_x1": 545.115, "r_y1": 386.625, "r_x2": 545.115, "r_y2": 378.073, "r_x3": 341.808, "r_y3": 378.073, "coord_origin": "TOPLEFT"}, "text": "The conversion of an image into a sequence of to-", "orig": "The conversion of an image into a sequence of to-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 133, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 398.58, "r_x1": 545.115, "r_y1": 398.58, "r_x2": 545.115, "r_y2": 390.028, "r_x3": 308.862, "r_y3": 390.028, "coord_origin": "TOPLEFT"}, "text": "kens is a well-known task [35, 16]. While attention is often", "orig": "kens is a well-known task [35, 16]. While attention is often", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 134, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 410.535, "r_x1": 545.115, "r_y1": 410.535, "r_x2": 545.115, "r_y2": 401.983, "r_x3": 308.862, "r_y3": 401.983, "coord_origin": "TOPLEFT"}, "text": "used as an implicit method to associate each token of the", "orig": "used as an implicit method to associate each token of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 135, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 422.491, "r_x1": 545.115, "r_y1": 422.491, "r_x2": 545.115, "r_y2": 413.939, "r_x3": 308.862, "r_y3": 413.939, "coord_origin": "TOPLEFT"}, "text": "sequence with a position in the original image, an explicit", "orig": "sequence with a position in the original image, an explicit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 136, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 434.446, "r_x1": 545.115, "r_y1": 434.446, "r_x2": 545.115, "r_y2": 425.894, "r_x3": 308.862, "r_y3": 425.894, "coord_origin": "TOPLEFT"}, "text": "association between the individual table-cells and the image", "orig": "association between the individual table-cells and the image", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 137, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 446.401, "r_x1": 437.937, "r_y1": 446.401, "r_x2": 437.937, "r_y2": 437.849, "r_x3": 308.862, "r_y3": 437.849, "coord_origin": "TOPLEFT"}, "text": "bounding boxes is also required.", "orig": "bounding boxes is also required.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Given the image of a table, TableFormer is able to predict: 1) a sequence of tokens that represent the structure of a table, and 2) a bounding box coupled to a subset of those tokens. The conversion of an image into a sequence of tokens is a well-known task [35, 16]. While attention is often used as an implicit method to associate each token of the sequence with a position in the original image, an explicit association between the individual table-cells and the image bounding boxes is also required."}, {"label": "section_header", "id": 12, "page_no": 3, "cluster": {"id": 12, "label": "section_header", "bbox": {"l": 308.862, "t": 457.694, "r": 420.161, "b": 467.546, "coord_origin": "TOPLEFT"}, "confidence": 0.937696099281311, "cells": [{"index": 138, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 467.546, "r_x1": 420.161, "r_y1": 467.546, "r_x2": 420.161, "r_y2": 457.694, "r_x3": 308.862, "r_y3": 457.694, "coord_origin": "TOPLEFT"}, "text": "4.1. Model architecture.", "orig": "4.1. Model architecture.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "4.1. Model architecture."}, {"label": "text", "id": 2, "page_no": 3, "cluster": {"id": 2, "label": "text", "bbox": {"l": 308.862, "t": 477.034, "r": 545.116, "b": 664.914, "coord_origin": "TOPLEFT"}, "confidence": 0.9878323078155518, "cells": [{"index": 139, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 485.586, "r_x1": 545.115, "r_y1": 485.586, "r_x2": 545.115, "r_y2": 477.034, "r_x3": 320.817, "r_y3": 477.034, "coord_origin": "TOPLEFT"}, "text": "We now describe in detail the proposed method, which", "orig": "We now describe in detail the proposed method, which", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 140, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 497.541, "r_x1": 315.507, "r_y1": 497.541, "r_x2": 315.507, "r_y2": 488.989, "r_x3": 308.862, "r_y3": 488.989, "coord_origin": "TOPLEFT"}, "text": "is", "orig": "is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 141, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 319.153, "r_y0": 497.541, "r_x1": 509.021, "r_y1": 497.541, "r_x2": 509.021, "r_y2": 488.989, "r_x3": 319.153, "r_y3": 488.989, "coord_origin": "TOPLEFT"}, "text": "composed of three main components, see Fig.", "orig": "composed of three main components, see Fig.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 142, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 515.586, "r_y0": 497.541, "r_x1": 523.058, "r_y1": 497.541, "r_x2": 523.058, "r_y2": 488.989, "r_x3": 515.586, "r_y3": 488.989, "coord_origin": "TOPLEFT"}, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 143, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 529.623, "r_y0": 497.541, "r_x1": 545.115, "r_y1": 497.541, "r_x2": 545.115, "r_y2": 488.989, "r_x3": 529.623, "r_y3": 488.989, "coord_origin": "TOPLEFT"}, "text": "Our", "orig": "Our", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 144, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 509.353, "r_x1": 406.346, "r_y1": 509.353, "r_x2": 406.346, "r_y2": 500.765, "r_x3": 308.862, "r_y3": 500.765, "coord_origin": "TOPLEFT"}, "text": "CNN Backbone Network", "orig": "CNN Backbone Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 145, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 408.872, "r_y0": 509.496, "r_x1": 545.111, "r_y1": 509.496, "r_x2": 545.111, "r_y2": 500.944, "r_x3": 408.872, "r_y3": 500.944, "coord_origin": "TOPLEFT"}, "text": "encodes the input as a feature vec-", "orig": "encodes the input as a feature vec-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 146, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 521.452, "r_x1": 319.93, "r_y1": 521.452, "r_x2": 319.93, "r_y2": 512.9, "r_x3": 308.862, "r_y3": 512.9, "coord_origin": "TOPLEFT"}, "text": "tor", "orig": "tor", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 147, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 323.836, "r_y0": 521.452, "r_x1": 409.395, "r_y1": 521.452, "r_x2": 409.395, "r_y2": 512.9, "r_x3": 323.836, "r_y3": 512.9, "coord_origin": "TOPLEFT"}, "text": "of predefined length.", "orig": "of predefined length.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 148, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 416.727, "r_y0": 521.452, "r_x1": 545.115, "r_y1": 521.452, "r_x2": 545.115, "r_y2": 512.9, "r_x3": 416.727, "r_y3": 512.9, "coord_origin": "TOPLEFT"}, "text": "The input feature vector of the", "orig": "The input feature vector of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 149, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 533.4069999999999, "r_x1": 436.194, "r_y1": 533.4069999999999, "r_x2": 436.194, "r_y2": 524.855, "r_x3": 308.862, "r_y3": 524.855, "coord_origin": "TOPLEFT"}, "text": "encoded image is passed to the", "orig": "encoded image is passed to the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 150, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 439.526, "r_y0": 533.264, "r_x1": 513.867, "r_y1": 533.264, "r_x2": 513.867, "r_y2": 524.6759999999999, "r_x3": 439.526, "r_y3": 524.6759999999999, "coord_origin": "TOPLEFT"}, "text": "Structure Decoder", "orig": "Structure Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 151, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 517.432, "r_y0": 533.4069999999999, "r_x1": 545.108, "r_y1": 533.4069999999999, "r_x2": 545.108, "r_y2": 524.855, "r_x3": 517.432, "r_y3": 524.855, "coord_origin": "TOPLEFT"}, "text": "to pro-", "orig": "to pro-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 152, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 545.362, "r_x1": 545.115, "r_y1": 545.362, "r_x2": 545.115, "r_y2": 536.81, "r_x3": 308.862, "r_y3": 536.81, "coord_origin": "TOPLEFT"}, "text": "duce a sequence of HTML tags that represent the structure", "orig": "duce a sequence of HTML tags that represent the structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 153, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 557.317, "r_x1": 358.545, "r_y1": 557.317, "r_x2": 358.545, "r_y2": 548.765, "r_x3": 308.862, "r_y3": 548.765, "coord_origin": "TOPLEFT"}, "text": "of the table.", "orig": "of the table.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 154, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 365.191, "r_y0": 557.317, "r_x1": 545.115, "r_y1": 557.317, "r_x2": 545.115, "r_y2": 548.765, "r_x3": 365.191, "r_y3": 548.765, "coord_origin": "TOPLEFT"}, "text": "With each prediction of an HTML standard", "orig": "With each prediction of an HTML standard", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 155, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 569.2719999999999, "r_x1": 352.409, "r_y1": 569.2719999999999, "r_x2": 352.409, "r_y2": 560.72, "r_x3": 308.862, "r_y3": 560.72, "coord_origin": "TOPLEFT"}, "text": "data cell ('", "orig": "data cell ('", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 156, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 352.409, "r_y0": 569.108, "r_x1": 360.158, "r_y1": 569.108, "r_x2": 360.158, "r_y2": 560.402, "r_x3": 352.409, "r_y3": 560.402, "coord_origin": "TOPLEFT"}, "text": "<", "orig": "<", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 157, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 360.158, "r_y0": 569.2719999999999, "r_x1": 367.909, "r_y1": 569.2719999999999, "r_x2": 367.909, "r_y2": 560.72, "r_x3": 360.158, "r_y3": 560.72, "coord_origin": "TOPLEFT"}, "text": "td", "orig": "td", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 158, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 367.909, "r_y0": 569.108, "r_x1": 375.658, "r_y1": 569.108, "r_x2": 375.658, "r_y2": 560.402, "r_x3": 367.909, "r_y3": 560.402, "coord_origin": "TOPLEFT"}, "text": ">", "orig": ">", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 159, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 375.658, "r_y0": 569.2719999999999, "r_x1": 545.112, "r_y1": 569.2719999999999, "r_x2": 545.112, "r_y2": 560.72, "r_x3": 375.658, "r_y3": 560.72, "coord_origin": "TOPLEFT"}, "text": "') the hidden state of that cell is passed to", "orig": "') the hidden state of that cell is passed to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 160, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 581.2280000000001, "r_x1": 545.115, "r_y1": 581.2280000000001, "r_x2": 545.115, "r_y2": 572.6759999999999, "r_x3": 308.862, "r_y3": 572.6759999999999, "coord_origin": "TOPLEFT"}, "text": "the Cell BBox Decoder. As for spanning cells, such as row", "orig": "the Cell BBox Decoder. As for spanning cells, such as row", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 161, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 593.183, "r_x1": 483.118, "r_y1": 593.183, "r_x2": 483.118, "r_y2": 584.631, "r_x3": 308.862, "r_y3": 584.631, "coord_origin": "TOPLEFT"}, "text": "or column span, the tag is broken down to '", "orig": "or column span, the tag is broken down to '", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 162, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 483.119, "r_y0": 593.019, "r_x1": 490.868, "r_y1": 593.019, "r_x2": 490.868, "r_y2": 584.313, "r_x3": 483.119, "r_y3": 584.313, "coord_origin": "TOPLEFT"}, "text": "<", "orig": "<", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 163, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 490.868, "r_y0": 593.183, "r_x1": 545.114, "r_y1": 593.183, "r_x2": 545.114, "r_y2": 584.631, "r_x3": 490.868, "r_y3": 584.631, "coord_origin": "TOPLEFT"}, "text": "', 'rowspan='", "orig": "', 'rowspan='", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 164, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 605.138, "r_x1": 545.115, "r_y1": 605.138, "r_x2": 545.115, "r_y2": 596.586, "r_x3": 308.862, "r_y3": 596.586, "coord_origin": "TOPLEFT"}, "text": "or 'colspan=', with the number of spanning cells (attribute),", "orig": "or 'colspan=', with the number of spanning cells (attribute),", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 165, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 617.093, "r_x1": 329.644, "r_y1": 617.093, "r_x2": 329.644, "r_y2": 608.5409999999999, "r_x3": 308.862, "r_y3": 608.5409999999999, "coord_origin": "TOPLEFT"}, "text": "and '", "orig": "and '", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 166, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 329.646, "r_y0": 616.929, "r_x1": 337.395, "r_y1": 616.929, "r_x2": 337.395, "r_y2": 608.223, "r_x3": 329.646, "r_y3": 608.223, "coord_origin": "TOPLEFT"}, "text": ">", "orig": ">", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 167, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 337.394, "r_y0": 617.093, "r_x1": 343.202, "r_y1": 617.093, "r_x2": 343.202, "r_y2": 608.5409999999999, "r_x3": 337.394, "r_y3": 608.5409999999999, "coord_origin": "TOPLEFT"}, "text": "'.", "orig": "'.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 168, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 348.064, "r_y0": 617.093, "r_x1": 468.591, "r_y1": 617.093, "r_x2": 468.591, "r_y2": 608.5409999999999, "r_x3": 348.064, "r_y3": 608.5409999999999, "coord_origin": "TOPLEFT"}, "text": "The hidden state attached to '", "orig": "The hidden state attached to '", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 169, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 468.595, "r_y0": 616.929, "r_x1": 476.344, "r_y1": 616.929, "r_x2": 476.344, "r_y2": 608.223, "r_x3": 468.595, "r_y3": 608.223, "coord_origin": "TOPLEFT"}, "text": "<", "orig": "<", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 170, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 476.344, "r_y0": 617.093, "r_x1": 545.116, "r_y1": 617.093, "r_x2": 545.116, "r_y2": 608.5409999999999, "r_x3": 476.344, "r_y3": 608.5409999999999, "coord_origin": "TOPLEFT"}, "text": "' is passed to the", "orig": "' is passed to the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 171, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 629.048, "r_x1": 545.115, "r_y1": 629.048, "r_x2": 545.115, "r_y2": 620.496, "r_x3": 308.862, "r_y3": 620.496, "coord_origin": "TOPLEFT"}, "text": "Cell BBox Decoder. A shared feed forward network (FFN)", "orig": "Cell BBox Decoder. A shared feed forward network (FFN)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 172, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 641.0029999999999, "r_x1": 533.2, "r_y1": 641.0029999999999, "r_x2": 533.2, "r_y2": 632.451, "r_x3": 308.862, "r_y3": 632.451, "coord_origin": "TOPLEFT"}, "text": "receives the hidden states from the Structure Decoder,", "orig": "receives the hidden states from the Structure Decoder,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 173, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 537.364, "r_y0": 641.0029999999999, "r_x1": 545.115, "r_y1": 641.0029999999999, "r_x2": 545.115, "r_y2": 632.451, "r_x3": 537.364, "r_y3": 632.451, "coord_origin": "TOPLEFT"}, "text": "to", "orig": "to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 174, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 652.9590000000001, "r_x1": 545.115, "r_y1": 652.9590000000001, "r_x2": 545.115, "r_y2": 644.407, "r_x3": 308.862, "r_y3": 644.407, "coord_origin": "TOPLEFT"}, "text": "provide the final detection predictions of the bounding box", "orig": "provide the final detection predictions of the bounding box", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 175, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 664.914, "r_x1": 449.424, "r_y1": 664.914, "r_x2": 449.424, "r_y2": 656.362, "r_x3": 308.862, "r_y3": 656.362, "coord_origin": "TOPLEFT"}, "text": "coordinates and their classification.", "orig": "coordinates and their classification.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "We now describe in detail the proposed method, which is composed of three main components, see Fig. 4. Our CNN Backbone Network encodes the input as a feature vector of predefined length. The input feature vector of the encoded image is passed to the Structure Decoder to produce a sequence of HTML tags that represent the structure of the table. With each prediction of an HTML standard data cell (' < td > ') the hidden state of that cell is passed to the Cell BBox Decoder. As for spanning cells, such as row or column span, the tag is broken down to ' < ', 'rowspan=' or 'colspan=', with the number of spanning cells (attribute), and ' > '. The hidden state attached to ' < ' is passed to the Cell BBox Decoder. A shared feed forward network (FFN) receives the hidden states from the Structure Decoder, to provide the final detection predictions of the bounding box coordinates and their classification."}, {"label": "text", "id": 7, "page_no": 3, "cluster": {"id": 7, "label": "text", "bbox": {"l": 308.862, "t": 668.261, "r": 545.115, "b": 713.066, "coord_origin": "TOPLEFT"}, "confidence": 0.978580117225647, "cells": [{"index": 176, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 677.217, "r_x1": 431.91, "r_y1": 677.217, "r_x2": 431.91, "r_y2": 668.261, "r_x3": 320.817, "r_y3": 668.261, "coord_origin": "TOPLEFT"}, "text": "CNN Backbone Network.", "orig": "CNN Backbone Network.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 177, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 439.499, "r_y0": 677.201, "r_x1": 545.113, "r_y1": 677.201, "r_x2": 545.113, "r_y2": 668.649, "r_x3": 439.499, "r_y3": 668.649, "coord_origin": "TOPLEFT"}, "text": "A ResNet-18 CNN is the", "orig": "A ResNet-18 CNN is the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 178, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 689.156, "r_x1": 545.115, "r_y1": 689.156, "r_x2": 545.115, "r_y2": 680.604, "r_x3": 308.862, "r_y3": 680.604, "coord_origin": "TOPLEFT"}, "text": "backbone that receives the table image and encodes it as a", "orig": "backbone that receives the table image and encodes it as a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 179, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 701.111, "r_x1": 545.115, "r_y1": 701.111, "r_x2": 545.115, "r_y2": 692.559, "r_x3": 308.862, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "vector of predefined length. The network has been modified", "orig": "vector of predefined length. The network has been modified", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 180, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 713.066, "r_x1": 545.115, "r_y1": 713.066, "r_x2": 545.115, "r_y2": 704.514, "r_x3": 308.862, "r_y3": 704.514, "coord_origin": "TOPLEFT"}, "text": "by removing the linear and pooling layer, as we are not per-", "orig": "by removing the linear and pooling layer, as we are not per-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "CNN Backbone Network. A ResNet-18 CNN is the backbone that receives the table image and encodes it as a vector of predefined length. The network has been modified by removing the linear and pooling layer, as we are not per-"}], "headers": [{"label": "page_footer", "id": 14, "page_no": 3, "cluster": {"id": 14, "label": "page_footer", "bbox": {"l": 295.121, "t": 734.402, "r": 300.102, "b": 742.954, "coord_origin": "TOPLEFT"}, "confidence": 0.8565718531608582, "cells": [{"index": 181, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 295.121, "r_y0": 742.954, "r_x1": 300.102, "r_y1": 742.954, "r_x2": 300.102, "r_y2": 734.402, "r_x3": 295.121, "r_y3": 734.402, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "4"}]}}, {"page_no": 4, "size": {"width": 612.0, "height": 792.0}, "cells": [{"index": 0, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 81.688, "r_y0": 125.61699999999996, "r_x1": 84.524, "r_y1": 125.61699999999996, "r_x2": 84.524, "r_y2": 122.481, "r_x3": 81.688, "r_y3": 122.481, "coord_origin": "TOPLEFT"}, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 86.413, "r_y0": 125.61699999999996, "r_x1": 93.026, "r_y1": 125.61699999999996, "r_x2": 93.026, "r_y2": 122.481, "r_x3": 86.413, "r_y3": 122.481, "coord_origin": "TOPLEFT"}, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 102.505, "r_y0": 118.42999999999995, "r_x1": 115.346, "r_y1": 118.42999999999995, "r_x2": 115.346, "r_y2": 115.293, "r_x3": 102.505, "r_y3": 115.293, "coord_origin": "TOPLEFT"}, "text": "Amount", "orig": "Amount", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 82.14, "r_y0": 118.39200000000005, "r_x1": 93.292, "r_y1": 118.39200000000005, "r_x2": 93.292, "r_y2": 115.25599999999997, "r_x3": 82.14, "r_y3": 115.25599999999997, "coord_origin": "TOPLEFT"}, "text": "Names", "orig": "Names", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 96.748, "r_y0": 125.61699999999996, "r_x1": 104.312, "r_y1": 125.61699999999996, "r_x2": 104.312, "r_y2": 122.481, "r_x3": 96.748, "r_y3": 122.481, "coord_origin": "TOPLEFT"}, "text": "1000", "orig": "1000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 96.748, "r_y0": 130.92100000000005, "r_x1": 102.421, "r_y1": 130.92100000000005, "r_x2": 102.421, "r_y2": 127.78499999999997, "r_x3": 96.748, "r_y3": 127.78499999999997, "coord_origin": "TOPLEFT"}, "text": "500", "orig": "500", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 96.748, "r_y0": 136.63300000000004, "r_x1": 104.312, "r_y1": 136.63300000000004, "r_x2": 104.312, "r_y2": 133.49699999999996, "r_x3": 96.748, "r_y3": 133.49699999999996, "coord_origin": "TOPLEFT"}, "text": "3500", "orig": "3500", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 96.748, "r_y0": 142.34500000000003, "r_x1": 102.421, "r_y1": 142.34500000000003, "r_x2": 102.421, "r_y2": 139.20899999999995, "r_x3": 96.748, "r_y3": 139.20899999999995, "coord_origin": "TOPLEFT"}, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 110.661, "r_y0": 125.61699999999996, "r_x1": 116.144, "r_y1": 125.61699999999996, "r_x2": 116.144, "r_y2": 122.481, "r_x3": 110.661, "r_y3": 122.481, "coord_origin": "TOPLEFT"}, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 110.661, "r_y0": 130.92100000000005, "r_x1": 116.144, "r_y1": 130.92100000000005, "r_x2": 116.144, "r_y2": 127.78499999999997, "r_x3": 110.661, "r_y3": 127.78499999999997, "coord_origin": "TOPLEFT"}, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 110.661, "r_y0": 136.63300000000004, "r_x1": 116.144, "r_y1": 136.63300000000004, "r_x2": 116.144, "r_y2": 133.49699999999996, "r_x3": 110.661, "r_y3": 133.49699999999996, "coord_origin": "TOPLEFT"}, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 110.661, "r_y0": 142.34500000000003, "r_x1": 116.144, "r_y1": 142.34500000000003, "r_x2": 116.144, "r_y2": 139.20899999999995, "r_x3": 110.661, "r_y3": 139.20899999999995, "coord_origin": "TOPLEFT"}, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 81.688, "r_y0": 130.92100000000005, "r_x1": 84.524, "r_y1": 130.92100000000005, "r_x2": 84.524, "r_y2": 127.78499999999997, "r_x3": 81.688, "r_y3": 127.78499999999997, "coord_origin": "TOPLEFT"}, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 86.413, "r_y0": 130.92100000000005, "r_x1": 93.026, "r_y1": 130.92100000000005, "r_x2": 93.026, "r_y2": 127.78499999999997, "r_x3": 86.413, "r_y3": 127.78499999999997, "coord_origin": "TOPLEFT"}, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 81.688, "r_y0": 136.63300000000004, "r_x1": 84.524, "r_y1": 136.63300000000004, "r_x2": 84.524, "r_y2": 133.49699999999996, "r_x3": 81.688, "r_y3": 133.49699999999996, "coord_origin": "TOPLEFT"}, "text": "3.", "orig": "3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 86.413, "r_y0": 136.63300000000004, "r_x1": 93.026, "r_y1": 136.63300000000004, "r_x2": 93.026, "r_y2": 133.49699999999996, "r_x3": 86.413, "r_y3": 133.49699999999996, "coord_origin": "TOPLEFT"}, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 81.688, "r_y0": 142.34500000000003, "r_x1": 84.524, "r_y1": 142.34500000000003, "r_x2": 84.524, "r_y2": 139.20899999999995, "r_x3": 81.688, "r_y3": 139.20899999999995, "coord_origin": "TOPLEFT"}, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 86.413, "r_y0": 142.34500000000003, "r_x1": 93.026, "r_y1": 142.34500000000003, "r_x2": 93.026, "r_y2": 139.20899999999995, "r_x3": 86.413, "r_y3": 139.20899999999995, "coord_origin": "TOPLEFT"}, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 88.084, "r_y0": 96.21699999999998, "r_x1": 113.936, "r_y1": 96.21699999999998, "r_x2": 113.936, "r_y2": 90.57100000000003, "r_x3": 88.084, "r_y3": 90.57100000000003, "coord_origin": "TOPLEFT"}, "text": "Extracted", "orig": "Extracted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 19, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 82.81, "r_y0": 103.35699999999997, "r_x1": 119.212, "r_y1": 103.35699999999997, "r_x2": 119.212, "r_y2": 97.71100000000001, "r_x3": 82.81, "r_y3": 97.71100000000001, "coord_origin": "TOPLEFT"}, "text": "Table Images", "orig": "Table Images", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 20, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 143.942, "r_y0": 106.322, "r_x1": 180.011, "r_y1": 106.322, "r_x2": 180.011, "r_y2": 100.67600000000004, "r_x3": 143.942, "r_y3": 100.67600000000004, "coord_origin": "TOPLEFT"}, "text": "Standardized", "orig": "Standardized", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 21, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.941, "r_y0": 113.46199999999999, "r_x1": 172.012, "r_y1": 113.46199999999999, "r_x2": 172.012, "r_y2": 107.81600000000003, "r_x3": 151.941, "r_y3": 107.81600000000003, "coord_origin": "TOPLEFT"}, "text": "Images", "orig": "Images", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 22, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 251.769, "r_y0": 86.64999999999998, "r_x1": 266.396, "r_y1": 86.64999999999998, "r_x2": 266.396, "r_y2": 81.00400000000002, "r_x3": 251.769, "r_y3": 81.00400000000002, "coord_origin": "TOPLEFT"}, "text": "BBox", "orig": "BBox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 23, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 247.516, "r_y0": 91.75, "r_x1": 270.65, "r_y1": 91.75, "r_x2": 270.65, "r_y2": 86.10400000000004, "r_x3": 247.516, "r_y3": 86.10400000000004, "coord_origin": "TOPLEFT"}, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 24, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 331.037, "r_y0": 84.279, "r_x1": 352.126, "r_y1": 84.279, "r_x2": 352.126, "r_y2": 78.63300000000004, "r_x3": 331.037, "r_y3": 78.63300000000004, "coord_origin": "TOPLEFT"}, "text": "BBoxes", "orig": "BBoxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 25, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 390.564, "r_y0": 101.75199999999995, "r_x1": 431.726, "r_y1": 101.75199999999995, "r_x2": 431.726, "r_y2": 96.106, "r_x3": 390.564, "r_y3": 96.106, "coord_origin": "TOPLEFT"}, "text": "BBoxes can be", "orig": "BBoxes can be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 26, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 386.824, "r_y0": 107.87199999999996, "r_x1": 435.47, "r_y1": 107.87199999999996, "r_x2": 435.47, "r_y2": 102.226, "r_x3": 386.824, "r_y3": 102.226, "coord_origin": "TOPLEFT"}, "text": "traced back to the", "orig": "traced back to the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 27, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 388.696, "r_y0": 113.99199999999996, "r_x1": 433.603, "r_y1": 113.99199999999996, "r_x2": 433.603, "r_y2": 108.346, "r_x3": 388.696, "r_y3": 108.346, "coord_origin": "TOPLEFT"}, "text": "original image to", "orig": "original image to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 28, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 391.078, "r_y0": 120.11199999999997, "r_x1": 431.225, "r_y1": 120.11199999999997, "r_x2": 431.225, "r_y2": 114.46600000000001, "r_x3": 391.078, "r_y3": 114.46600000000001, "coord_origin": "TOPLEFT"}, "text": "extract content", "orig": "extract content", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 29, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 431.227, "r_y0": 157.40499999999997, "r_x1": 498.821, "r_y1": 157.40499999999997, "r_x2": 498.821, "r_y2": 151.75900000000001, "r_x3": 431.227, "r_y3": 151.75900000000001, "coord_origin": "TOPLEFT"}, "text": "Structure Tags sequence", "orig": "Structure Tags sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 30, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 431.174, "r_y0": 163.52499999999998, "r_x1": 498.878, "r_y1": 163.52499999999998, "r_x2": 498.878, "r_y2": 157.87900000000002, "r_x3": 431.174, "r_y3": 157.87900000000002, "coord_origin": "TOPLEFT"}, "text": "provide full description of", "orig": "provide full description of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 440.529, "r_y0": 169.64499999999998, "r_x1": 489.518, "r_y1": 169.64499999999998, "r_x2": 489.518, "r_y2": 163.99900000000002, "r_x3": 440.529, "r_y3": 163.99900000000002, "coord_origin": "TOPLEFT"}, "text": "the table structure", "orig": "the table structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.375, "r_y0": 183.97299999999996, "r_x1": 367.723, "r_y1": 183.97299999999996, "r_x2": 367.723, "r_y2": 178.327, "r_x3": 328.375, "r_y3": 178.327, "coord_origin": "TOPLEFT"}, "text": "Structure Tags", "orig": "Structure Tags", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 331.845, "r_y0": 129.62800000000004, "r_x1": 373.68, "r_y1": 129.62800000000004, "r_x2": 373.68, "r_y2": 123.98199999999997, "r_x3": 331.845, "r_y3": 123.98199999999997, "coord_origin": "TOPLEFT"}, "text": "BBoxes in sync", "orig": "BBoxes in sync", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 331.845, "r_y0": 134.72799999999995, "r_x1": 381.178, "r_y1": 134.72799999999995, "r_x2": 381.178, "r_y2": 129.082, "r_x3": 331.845, "r_y3": 129.082, "coord_origin": "TOPLEFT"}, "text": "with tag sequence", "orig": "with tag sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 196.626, "r_y0": 93.83600000000001, "r_x1": 219.423, "r_y1": 93.83600000000001, "r_x2": 219.423, "r_y2": 88.19000000000005, "r_x3": 196.626, "r_y3": 88.19000000000005, "coord_origin": "TOPLEFT"}, "text": "Encoder", "orig": "Encoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 246.668, "r_y0": 135.21400000000006, "r_x1": 271.499, "r_y1": 135.21400000000006, "r_x2": 271.499, "r_y2": 129.56799999999998, "r_x3": 246.668, "r_y3": 129.56799999999998, "coord_origin": "TOPLEFT"}, "text": "Structure", "orig": "Structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 247.516, "r_y0": 140.31399999999996, "r_x1": 270.65, "r_y1": 140.31399999999996, "r_x2": 270.65, "r_y2": 134.668, "r_x3": 247.516, "r_y3": 134.668, "coord_origin": "TOPLEFT"}, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 330.631, "r_y0": 94.73900000000003, "r_x1": 365.553, "r_y1": 94.73900000000003, "r_x2": 365.553, "r_y2": 89.09299999999996, "r_x3": 330.631, "r_y3": 89.09299999999996, "coord_origin": "TOPLEFT"}, "text": "[x1, y2, x2, y2]", "orig": "[x1, y2, x2, y2]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 330.631, "r_y0": 102.899, "r_x1": 370.227, "r_y1": 102.899, "r_x2": 370.227, "r_y2": 97.25300000000004, "r_x3": 330.631, "r_y3": 97.25300000000004, "coord_origin": "TOPLEFT"}, "text": "[x1', y2', x2', y2']", "orig": "[x1', y2', x2', y2']", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 330.631, "r_y0": 111.05899999999997, "r_x1": 374.512, "r_y1": 111.05899999999997, "r_x2": 374.512, "r_y2": 105.41300000000001, "r_x3": 330.631, "r_y3": 105.41300000000001, "coord_origin": "TOPLEFT"}, "text": "[x1'', y2'', x2'', y2'']", "orig": "[x1'', y2'', x2'', y2'']", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 330.631, "r_y0": 119.21900000000005, "r_x1": 335.732, "r_y1": 119.21900000000005, "r_x2": 335.732, "r_y2": 113.57299999999998, "r_x3": 330.631, "r_y3": 113.57299999999998, "coord_origin": "TOPLEFT"}, "text": "...", "orig": "...", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 322.306, "r_y0": 146.558, "r_x1": 335.06, "r_y1": 146.558, "r_x2": 335.06, "r_y2": 141.85400000000004, "r_x3": 322.306, "r_y3": 141.85400000000004, "coord_origin": "TOPLEFT"}, "text": "<TR>", "orig": "<TR>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 322.306, "r_y0": 153.69799999999998, "r_x1": 421.588, "r_y1": 153.69799999999998, "r_x2": 421.588, "r_y2": 148.99400000000003, "r_x3": 322.306, "r_y3": 148.99400000000003, "coord_origin": "TOPLEFT"}, "text": "<TD> 1 </TD><TD colspan=\"2\"> 2 </TD>", "orig": "<TD> 1 </TD><TD colspan=\"2\"> 2 </TD>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 322.306, "r_y0": 160.83799999999997, "r_x1": 349.23, "r_y1": 160.83799999999997, "r_x2": 349.23, "r_y2": 156.13400000000001, "r_x3": 322.306, "r_y3": 156.13400000000001, "coord_origin": "TOPLEFT"}, "text": "</TR><TR>", "orig": "</TR><TR>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 322.306, "r_y0": 167.97799999999995, "r_x1": 374.737, "r_y1": 167.97799999999995, "r_x2": 374.737, "r_y2": 163.274, "r_x3": 322.306, "r_y3": 163.274, "coord_origin": "TOPLEFT"}, "text": "<TD> 3 </TD><TD>...", "orig": "<TD> 3 </TD><TD>...", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 322.306, "r_y0": 175.11800000000005, "r_x1": 326.557, "r_y1": 175.11800000000005, "r_x2": 326.557, "r_y2": 170.414, "r_x3": 322.306, "r_y3": 170.414, "coord_origin": "TOPLEFT"}, "text": "...", "orig": "...", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 323.511, "r_y0": 95.38900000000001, "r_x1": 326.914, "r_y1": 95.38900000000001, "r_x2": 326.914, "r_y2": 89.74300000000005, "r_x3": 323.511, "r_y3": 89.74300000000005, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 48, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 323.715, "r_y0": 103.50800000000004, "r_x1": 327.118, "r_y1": 103.50800000000004, "r_x2": 327.118, "r_y2": 97.86199999999997, "r_x3": 323.715, "r_y3": 97.86199999999997, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 49, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 323.715, "r_y0": 111.70899999999995, "r_x1": 327.118, "r_y1": 111.70899999999995, "r_x2": 327.118, "r_y2": 106.06299999999999, "r_x3": 323.715, "r_y3": 106.06299999999999, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 50, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 454.464, "r_y0": 110.26499999999999, "r_x1": 457.867, "r_y1": 110.26499999999999, "r_x2": 457.867, "r_y2": 104.61900000000003, "r_x3": 454.464, "r_y3": 104.61900000000003, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 51, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 493.326, "r_y0": 96.81500000000005, "r_x1": 496.729, "r_y1": 96.81500000000005, "r_x2": 496.729, "r_y2": 91.16899999999998, "r_x3": 493.326, "r_y3": 91.16899999999998, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 52, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 454.083, "r_y0": 96.28800000000001, "r_x1": 457.486, "r_y1": 96.28800000000001, "r_x2": 457.486, "r_y2": 90.64200000000005, "r_x3": 454.083, "r_y3": 90.64200000000005, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 53, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 212.92600000000004, "r_x1": 86.884, "r_y1": 212.92600000000004, "r_x2": 86.884, "r_y2": 204.37400000000002, "r_x3": 50.112, "r_y3": 204.37400000000002, "coord_origin": "TOPLEFT"}, "text": "Figure 3:", "orig": "Figure 3:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 54, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 94.021, "r_y0": 212.942, "r_x1": 149.851, "r_y1": 212.942, "r_x2": 149.851, "r_y2": 203.986, "r_x3": 94.021, "r_y3": 203.986, "coord_origin": "TOPLEFT"}, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 55, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 152.861, "r_y0": 212.92600000000004, "r_x1": 545.108, "r_y1": 212.92600000000004, "r_x2": 545.108, "r_y2": 204.37400000000002, "r_x3": 152.861, "r_y3": 204.37400000000002, "coord_origin": "TOPLEFT"}, "text": "takes in an image of the PDF and creates bounding box and HTML structure predictions that are", "orig": "takes in an image of the PDF and creates bounding box and HTML structure predictions that are", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 56, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 224.88099999999997, "r_x1": 436.013, "r_y1": 224.88099999999997, "r_x2": 436.013, "r_y2": 216.32899999999995, "r_x3": 50.112, "r_y3": 216.32899999999995, "coord_origin": "TOPLEFT"}, "text": "synchronized. The bounding boxes grabs the content from the PDF and inserts it in the structure.", "orig": "synchronized. The bounding boxes grabs the content from the PDF and inserts it in the structure.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 57, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 74.253, "r_y0": 263.884, "r_x1": 101.758, "r_y1": 263.884, "r_x2": 101.758, "r_y2": 259.52, "r_x3": 74.253, "r_y3": 259.52, "coord_origin": "TOPLEFT"}, "text": "Input Image", "orig": "Input Image", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 58, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 122.3, "r_y0": 264.015, "r_x1": 157.84, "r_y1": 264.015, "r_x2": 157.84, "r_y2": 259.65, "r_x3": 122.3, "r_y3": 259.65, "coord_origin": "TOPLEFT"}, "text": "Tokenised Tags", "orig": "Tokenised Tags", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 59, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 78.549, "r_y0": 376.78, "r_x1": 125.684, "r_y1": 376.78, "r_x2": 125.684, "r_y2": 372.588, "r_x3": 78.549, "r_y3": 372.588, "coord_origin": "TOPLEFT"}, "text": "Multi-Head Attention", "orig": "Multi-Head Attention", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 60, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 78.513, "r_y0": 396.713, "r_x1": 125.111, "r_y1": 396.713, "r_x2": 125.111, "r_y2": 392.52, "r_x3": 78.513, "r_y3": 392.52, "coord_origin": "TOPLEFT"}, "text": "Add & Normalisation", "orig": "Add & Normalisation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 61, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 76.025, "r_y0": 429.848, "r_x1": 127.923, "r_y1": 429.848, "r_x2": 127.923, "r_y2": 425.655, "r_x3": 76.025, "r_y3": 425.655, "coord_origin": "TOPLEFT"}, "text": "Feed Forward Network", "orig": "Feed Forward Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 62, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 78.383, "r_y0": 450.284, "r_x1": 124.98, "r_y1": 450.284, "r_x2": 124.98, "r_y2": 446.091, "r_x3": 78.383, "r_y3": 446.091, "coord_origin": "TOPLEFT"}, "text": "Add & Normalisation", "orig": "Add & Normalisation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 63, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 167.469, "r_y0": 467.838, "r_x1": 181.629, "r_y1": 467.838, "r_x2": 181.629, "r_y2": 463.645, "r_x3": 167.469, "r_y3": 463.645, "coord_origin": "TOPLEFT"}, "text": "Linear", "orig": "Linear", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 64, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 165.613, "r_y0": 483.866, "r_x1": 184.432, "r_y1": 483.866, "r_x2": 184.432, "r_y2": 479.673, "r_x3": 165.613, "r_y3": 479.673, "coord_origin": "TOPLEFT"}, "text": "Softmax", "orig": "Softmax", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 65, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 65.32, "r_y0": 329.941, "r_x1": 132.925, "r_y1": 329.941, "r_x2": 132.925, "r_y2": 325.527, "r_x3": 65.32, "r_y3": 325.527, "coord_origin": "TOPLEFT"}, "text": "CNN BACKBONE ENCODER", "orig": "CNN BACKBONE ENCODER", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 66, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 119.515, "r_y0": 274.491, "r_x1": 126.837, "r_y1": 274.491, "r_x2": 126.837, "r_y2": 270.73900000000003, "r_x3": 119.515, "r_y3": 270.73900000000003, "coord_origin": "TOPLEFT"}, "text": "[30,", "orig": "[30,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 67, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 129.2, "r_y0": 274.491, "r_x1": 132.745, "r_y1": 274.491, "r_x2": 132.745, "r_y2": 270.73900000000003, "r_x3": 129.2, "r_y3": 270.73900000000003, "coord_origin": "TOPLEFT"}, "text": "1,", "orig": "1,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 68, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 135.108, "r_y0": 274.491, "r_x1": 138.652, "r_y1": 274.491, "r_x2": 138.652, "r_y2": 270.73900000000003, "r_x3": 135.108, "r_y3": 270.73900000000003, "coord_origin": "TOPLEFT"}, "text": "2,", "orig": "2,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 69, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 141.015, "r_y0": 274.491, "r_x1": 144.56, "r_y1": 274.491, "r_x2": 144.56, "r_y2": 270.73900000000003, "r_x3": 141.015, "r_y3": 270.73900000000003, "coord_origin": "TOPLEFT"}, "text": "3,", "orig": "3,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 70, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 146.923, "r_y0": 274.491, "r_x1": 160.625, "r_y1": 274.491, "r_x2": 160.625, "r_y2": 270.73900000000003, "r_x3": 146.923, "r_y3": 270.73900000000003, "coord_origin": "TOPLEFT"}, "text": "4, \u20263,", "orig": "4, \u20263,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 71, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 128.729, "r_y0": 279.741, "r_x1": 132.273, "r_y1": 279.741, "r_x2": 132.273, "r_y2": 275.98900000000003, "r_x3": 128.729, "r_y3": 275.98900000000003, "coord_origin": "TOPLEFT"}, "text": "4,", "orig": "4,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 72, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.636, "r_y0": 279.741, "r_x1": 138.181, "r_y1": 279.741, "r_x2": 138.181, "r_y2": 275.98900000000003, "r_x3": 134.636, "r_y3": 275.98900000000003, "coord_origin": "TOPLEFT"}, "text": "5,", "orig": "5,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 73, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 140.544, "r_y0": 279.741, "r_x1": 151.411, "r_y1": 279.741, "r_x2": 151.411, "r_y2": 275.98900000000003, "r_x3": 140.544, "r_y3": 275.98900000000003, "coord_origin": "TOPLEFT"}, "text": "8, 31]", "orig": "8, 31]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 74, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 60.434, "r_y0": 343.926, "r_x1": 79.019, "r_y1": 343.926, "r_x2": 79.019, "r_y2": 340.521, "r_x3": 60.434, "r_y3": 340.521, "coord_origin": "TOPLEFT"}, "text": "Positional", "orig": "Positional", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 75, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 60.598, "r_y0": 348.352, "r_x1": 78.855, "r_y1": 348.352, "r_x2": 78.855, "r_y2": 344.948, "r_x3": 60.598, "r_y3": 344.948, "coord_origin": "TOPLEFT"}, "text": "Encoding", "orig": "Encoding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 76, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.829, "r_y0": 298.344, "r_x1": 153.414, "r_y1": 298.344, "r_x2": 153.414, "r_y2": 294.939, "r_x3": 134.829, "r_y3": 294.939, "coord_origin": "TOPLEFT"}, "text": "Positional", "orig": "Positional", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 77, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.993, "r_y0": 302.77, "r_x1": 153.25, "r_y1": 302.77, "r_x2": 153.25, "r_y2": 299.365, "r_x3": 134.993, "r_y3": 299.365, "coord_origin": "TOPLEFT"}, "text": "Encoding", "orig": "Encoding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 78, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 150.552, "r_y0": 350.753, "r_x1": 197.149, "r_y1": 350.753, "r_x2": 197.149, "r_y2": 346.56, "r_x3": 150.552, "r_y3": 346.56, "coord_origin": "TOPLEFT"}, "text": "Add & Normalisation", "orig": "Add & Normalisation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 79, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 150.552, "r_y0": 399.818, "r_x1": 197.149, "r_y1": 399.818, "r_x2": 197.149, "r_y2": 395.625, "r_x3": 150.552, "r_y3": 395.625, "coord_origin": "TOPLEFT"}, "text": "Add & Normalisation", "orig": "Add & Normalisation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 80, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 150.185, "r_y0": 381.063, "r_x1": 197.32, "r_y1": 381.063, "r_x2": 197.32, "r_y2": 376.87, "r_x3": 150.185, "r_y3": 376.87, "coord_origin": "TOPLEFT"}, "text": "Multi-Head Attention", "orig": "Multi-Head Attention", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 81, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 150.552, "r_y0": 445.643, "r_x1": 197.149, "r_y1": 445.643, "r_x2": 197.149, "r_y2": 441.45, "r_x3": 150.552, "r_y3": 441.45, "coord_origin": "TOPLEFT"}, "text": "Add & Normalisation", "orig": "Add & Normalisation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 82, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 147.864, "r_y0": 427.488, "r_x1": 199.762, "r_y1": 427.488, "r_x2": 199.762, "r_y2": 423.295, "r_x3": 147.864, "r_y3": 423.295, "coord_origin": "TOPLEFT"}, "text": "Feed Forward Network", "orig": "Feed Forward Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 83, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 241.566, "r_y0": 319.657, "r_x1": 255.725, "r_y1": 319.657, "r_x2": 255.725, "r_y2": 315.465, "r_x3": 241.566, "r_y3": 315.465, "coord_origin": "TOPLEFT"}, "text": "Linear", "orig": "Linear", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 84, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 241.917, "r_y0": 366.759, "r_x1": 256.077, "r_y1": 366.759, "r_x2": 256.077, "r_y2": 362.567, "r_x3": 241.917, "r_y3": 362.567, "coord_origin": "TOPLEFT"}, "text": "Linear", "orig": "Linear", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 85, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 228.054, "r_y0": 342.014, "r_x1": 269.393, "r_y1": 342.014, "r_x2": 269.393, "r_y2": 337.821, "r_x3": 228.054, "r_y3": 337.821, "coord_origin": "TOPLEFT"}, "text": "Attention Network", "orig": "Attention Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 86, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 228.446, "r_y0": 410.541, "r_x1": 238.739, "r_y1": 410.541, "r_x2": 238.739, "r_y2": 406.349, "r_x3": 228.446, "r_y3": 406.349, "coord_origin": "TOPLEFT"}, "text": "MLP", "orig": "MLP", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 87, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 256.298, "r_y0": 410.598, "r_x1": 270.457, "r_y1": 410.598, "r_x2": 270.457, "r_y2": 406.405, "r_x3": 256.298, "r_y3": 406.405, "coord_origin": "TOPLEFT"}, "text": "Linear", "orig": "Linear", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 88, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 239.545, "r_y0": 387.608, "r_x1": 258.089, "r_y1": 387.608, "r_x2": 258.089, "r_y2": 383.415, "r_x3": 239.545, "r_y3": 383.415, "coord_origin": "TOPLEFT"}, "text": "Sigmoid", "orig": "Sigmoid", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 89, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 59.258, "r_y0": 449.783, "r_x1": 59.245, "r_y1": 384.871, "r_x2": 55.273, "r_y2": 384.872, "r_x3": 55.286, "r_y3": 449.784, "coord_origin": "TOPLEFT"}, "text": "Transformer Encoder Network", "orig": "Transformer Encoder Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 90, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 59.058, "r_y0": 378.454, "r_x1": 59.055, "r_y1": 373.809, "r_x2": 55.345, "r_y2": 373.812, "r_x3": 55.348, "r_y3": 378.457, "coord_origin": "TOPLEFT"}, "text": "x2", "orig": "x2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 91, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 85.296, "r_y0": 490.108, "r_x1": 122.166, "r_y1": 490.098, "r_x2": 122.165, "r_y2": 485.687, "r_x3": 85.295, "r_y3": 485.697, "coord_origin": "TOPLEFT"}, "text": "Encoded Output", "orig": "Encoded Output", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 92, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 229.666, "r_y0": 285.074, "r_x1": 265.321, "r_y1": 285.064, "r_x2": 265.32, "r_y2": 281.281, "r_x3": 229.665, "r_y3": 281.291, "coord_origin": "TOPLEFT"}, "text": "Encoded Output", "orig": "Encoded Output", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 93, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 157.174, "r_y0": 505.871, "r_x1": 190.419, "r_y1": 505.862, "r_x2": 190.417, "r_y2": 501.45, "r_x3": 157.172, "r_y3": 501.459, "coord_origin": "TOPLEFT"}, "text": "Predicted Tags", "orig": "Predicted Tags", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 94, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 227.816, "r_y0": 443.634, "r_x1": 269.396, "r_y1": 443.622, "r_x2": 269.395, "r_y2": 439.211, "r_x3": 227.815, "r_y3": 439.222, "coord_origin": "TOPLEFT"}, "text": "Bounding Boxes &", "orig": "Bounding Boxes &", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 95, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 233.703, "r_y0": 449.632, "r_x1": 263.513, "r_y1": 449.624, "r_x2": 263.511, "r_y2": 445.212, "r_x3": 233.701, "r_y3": 445.22, "coord_origin": "TOPLEFT"}, "text": "Classification", "orig": "Classification", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 96, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 184.747, "r_y0": 298.506, "r_x1": 210.91, "r_y1": 298.506, "r_x2": 210.91, "r_y2": 294.534, "r_x3": 184.747, "r_y3": 294.534, "coord_origin": "TOPLEFT"}, "text": "Transformer", "orig": "Transformer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 97, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 178.912, "r_y0": 304.256, "r_x1": 216.744, "r_y1": 304.256, "r_x2": 216.744, "r_y2": 300.284, "r_x3": 178.912, "r_y3": 300.284, "coord_origin": "TOPLEFT"}, "text": "Decoder Network", "orig": "Decoder Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 98, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 194.246, "r_y0": 287.601, "r_x1": 198.891, "r_y1": 287.601, "r_x2": 198.891, "r_y2": 283.891, "r_x3": 194.246, "r_y3": 283.891, "coord_origin": "TOPLEFT"}, "text": "x4", "orig": "x4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 99, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 221.456, "r_y0": 277.548, "r_x1": 276.471, "r_y1": 277.548, "r_x2": 276.471, "r_y2": 273.134, "r_x3": 221.456, "r_y3": 273.134, "coord_origin": "TOPLEFT"}, "text": "CELL BBOX DECODER", "orig": "CELL BBOX DECODER", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 100, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.652, "r_y0": 328.837, "r_x1": 195.97, "r_y1": 328.837, "r_x2": 195.97, "r_y2": 324.644, "r_x3": 151.652, "r_y3": 324.644, "coord_origin": "TOPLEFT"}, "text": "Masked Multi-Head", "orig": "Masked Multi-Head", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 101, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 163.433, "r_y0": 334.837, "r_x1": 184.19, "r_y1": 334.837, "r_x2": 184.19, "r_y2": 330.644, "r_x3": 163.433, "r_y3": 330.644, "coord_origin": "TOPLEFT"}, "text": "Attention", "orig": "Attention", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 102, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 536.723, "r_x1": 85.878, "r_y1": 536.723, "r_x2": 85.878, "r_y2": 528.171, "r_x3": 50.112, "r_y3": 528.171, "coord_origin": "TOPLEFT"}, "text": "Figure 4:", "orig": "Figure 4:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 103, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 90.73, "r_y0": 536.723, "r_x1": 229.787, "r_y1": 536.723, "r_x2": 229.787, "r_y2": 528.171, "r_x3": 90.73, "r_y3": 528.171, "coord_origin": "TOPLEFT"}, "text": "Given an input image of a table, the", "orig": "Given an input image of a table, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 104, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 231.787, "r_y0": 536.739, "r_x1": 267.762, "r_y1": 536.739, "r_x2": 267.762, "r_y2": 527.783, "r_x3": 231.787, "r_y3": 527.783, "coord_origin": "TOPLEFT"}, "text": "Encoder", "orig": "Encoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 105, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 269.764, "r_y0": 536.723, "r_x1": 286.362, "r_y1": 536.723, "r_x2": 286.362, "r_y2": 528.171, "r_x3": 269.764, "r_y3": 528.171, "coord_origin": "TOPLEFT"}, "text": "pro-", "orig": "pro-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 106, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 548.678, "r_x1": 286.365, "r_y1": 548.678, "r_x2": 286.365, "r_y2": 540.126, "r_x3": 50.112, "r_y3": 540.126, "coord_origin": "TOPLEFT"}, "text": "duces fixed-length features that represent the input image.", "orig": "duces fixed-length features that represent the input image.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 107, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 560.634, "r_x1": 205.847, "r_y1": 560.634, "r_x2": 205.847, "r_y2": 552.082, "r_x3": 50.112, "r_y3": 552.082, "coord_origin": "TOPLEFT"}, "text": "The features are then passed to both the", "orig": "The features are then passed to both the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 108, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 208.018, "r_y0": 560.65, "r_x1": 286.364, "r_y1": 560.65, "r_x2": 286.364, "r_y2": 551.694, "r_x3": 208.018, "r_y3": 551.694, "coord_origin": "TOPLEFT"}, "text": "Structure Decoder", "orig": "Structure Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 109, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 572.5889999999999, "r_x1": 64.498, "r_y1": 572.5889999999999, "r_x2": 64.498, "r_y2": 564.037, "r_x3": 50.112, "r_y3": 564.037, "coord_origin": "TOPLEFT"}, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 110, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 68.165, "r_y0": 572.605, "r_x1": 151.313, "r_y1": 572.605, "r_x2": 151.313, "r_y2": 563.649, "r_x3": 68.165, "r_y3": 563.649, "coord_origin": "TOPLEFT"}, "text": "Cell BBox Decoder", "orig": "Cell BBox Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 111, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.313, "r_y0": 572.5889999999999, "r_x1": 153.804, "r_y1": 572.5889999999999, "r_x2": 153.804, "r_y2": 564.037, "r_x3": 151.313, "r_y3": 564.037, "coord_origin": "TOPLEFT"}, "text": ".", "orig": ".", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 112, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.419, "r_y0": 572.5889999999999, "r_x1": 241.933, "r_y1": 572.5889999999999, "r_x2": 241.933, "r_y2": 564.037, "r_x3": 160.419, "r_y3": 564.037, "coord_origin": "TOPLEFT"}, "text": "During training, the", "orig": "During training, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 113, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 245.595, "r_y0": 572.605, "r_x1": 286.362, "r_y1": 572.605, "r_x2": 286.362, "r_y2": 563.649, "r_x3": 245.595, "r_y3": 563.649, "coord_origin": "TOPLEFT"}, "text": "Structure", "orig": "Structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 114, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 584.56, "r_x1": 85.519, "r_y1": 584.56, "r_x2": 85.519, "r_y2": 575.604, "r_x3": 50.112, "r_y3": 575.604, "coord_origin": "TOPLEFT"}, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 115, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 88.623, "r_y0": 584.544, "r_x1": 286.361, "r_y1": 584.544, "r_x2": 286.361, "r_y2": 575.992, "r_x3": 88.623, "r_y3": 575.992, "coord_origin": "TOPLEFT"}, "text": "receives 'tokenized tags' of the HTML code that", "orig": "receives 'tokenized tags' of the HTML code that", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 116, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 596.499, "r_x1": 286.365, "r_y1": 596.499, "r_x2": 286.365, "r_y2": 587.947, "r_x3": 50.112, "r_y3": 587.947, "coord_origin": "TOPLEFT"}, "text": "represent the table structure. Afterwards, a transformer en-", "orig": "represent the table structure. Afterwards, a transformer en-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 117, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 608.454, "r_x1": 286.365, "r_y1": 608.454, "r_x2": 286.365, "r_y2": 599.902, "r_x3": 50.112, "r_y3": 599.902, "coord_origin": "TOPLEFT"}, "text": "coder and decoder architecture is employed to produce fea-", "orig": "coder and decoder architecture is employed to produce fea-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 118, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 620.409, "r_x1": 240.438, "r_y1": 620.409, "r_x2": 240.438, "r_y2": 611.857, "r_x3": 50.112, "r_y3": 611.857, "coord_origin": "TOPLEFT"}, "text": "tures that are received by a linear layer, and the", "orig": "tures that are received by a linear layer, and the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 119, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 243.198, "r_y0": 620.425, "r_x1": 286.366, "r_y1": 620.425, "r_x2": 286.366, "r_y2": 611.469, "r_x3": 243.198, "r_y3": 611.469, "coord_origin": "TOPLEFT"}, "text": "Cell BBox", "orig": "Cell BBox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 120, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 632.381, "r_x1": 87.013, "r_y1": 632.381, "r_x2": 87.013, "r_y2": 623.425, "r_x3": 50.112, "r_y3": 623.425, "coord_origin": "TOPLEFT"}, "text": "Decoder.", "orig": "Decoder.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 121, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 93.14, "r_y0": 632.381, "r_x1": 286.365, "r_y1": 632.381, "r_x2": 286.365, "r_y2": 623.425, "r_x3": 93.14, "r_y3": 623.425, "coord_origin": "TOPLEFT"}, "text": "The linear layer is applied to the features to", "orig": "The linear layer is applied to the features to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 122, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 644.336, "r_x1": 286.365, "r_y1": 644.336, "r_x2": 286.365, "r_y2": 635.38, "r_x3": 50.112, "r_y3": 635.38, "coord_origin": "TOPLEFT"}, "text": "predict the tags. Simultaneously, the Cell BBox Decoder", "orig": "predict the tags. Simultaneously, the Cell BBox Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 123, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 656.275, "r_x1": 220.582, "r_y1": 656.275, "r_x2": 220.582, "r_y2": 647.723, "r_x3": 50.112, "r_y3": 647.723, "coord_origin": "TOPLEFT"}, "text": "selects features referring to the data cells ('", "orig": "selects features referring to the data cells ('", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 124, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 220.578, "r_y0": 656.111, "r_x1": 228.327, "r_y1": 656.111, "r_x2": 228.327, "r_y2": 647.405, "r_x3": 220.578, "r_y3": 647.405, "coord_origin": "TOPLEFT"}, "text": "<", "orig": "<", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 125, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 228.327, "r_y0": 656.275, "r_x1": 236.078, "r_y1": 656.275, "r_x2": 236.078, "r_y2": 647.723, "r_x3": 228.327, "r_y3": 647.723, "coord_origin": "TOPLEFT"}, "text": "td", "orig": "td", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 126, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 236.078, "r_y0": 656.111, "r_x1": 243.827, "r_y1": 656.111, "r_x2": 243.827, "r_y2": 647.405, "r_x3": 236.078, "r_y3": 647.405, "coord_origin": "TOPLEFT"}, "text": ">", "orig": ">", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 127, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 243.826, "r_y0": 656.275, "r_x1": 255.293, "r_y1": 656.275, "r_x2": 255.293, "r_y2": 647.723, "r_x3": 243.826, "r_y3": 647.723, "coord_origin": "TOPLEFT"}, "text": "', '", "orig": "', '", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 128, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 255.291, "r_y0": 656.111, "r_x1": 263.04, "r_y1": 656.111, "r_x2": 263.04, "r_y2": 647.405, "r_x3": 255.291, "r_y3": 647.405, "coord_origin": "TOPLEFT"}, "text": "<", "orig": "<", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 129, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 263.04, "r_y0": 656.275, "r_x1": 286.362, "r_y1": 656.275, "r_x2": 286.362, "r_y2": 647.723, "r_x3": 263.04, "r_y3": 647.723, "coord_origin": "TOPLEFT"}, "text": "') and", "orig": "') and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 130, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 668.23, "r_x1": 286.365, "r_y1": 668.23, "r_x2": 286.365, "r_y2": 659.678, "r_x3": 50.112, "r_y3": 659.678, "coord_origin": "TOPLEFT"}, "text": "passes them through an attention network, an MLP, and a", "orig": "passes them through an attention network, an MLP, and a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 131, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 680.185, "r_x1": 218.47, "r_y1": 680.185, "r_x2": 218.47, "r_y2": 671.633, "r_x3": 50.112, "r_y3": 671.633, "coord_origin": "TOPLEFT"}, "text": "linear layer to predict the bounding boxes.", "orig": "linear layer to predict the bounding boxes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 132, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 258.355, "r_x1": 545.115, "r_y1": 258.355, "r_x2": 545.115, "r_y2": 249.803, "r_x3": 308.862, "r_y3": 249.803, "coord_origin": "TOPLEFT"}, "text": "forming classification, and adding an adaptive pooling layer", "orig": "forming classification, and adding an adaptive pooling layer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 133, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 270.31100000000004, "r_x1": 366.466, "r_y1": 270.31100000000004, "r_x2": 366.466, "r_y2": 261.759, "r_x3": 308.862, "r_y3": 261.759, "coord_origin": "TOPLEFT"}, "text": "of size 28*28.", "orig": "of size 28*28.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 134, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 371.706, "r_y0": 270.31100000000004, "r_x1": 545.115, "r_y1": 270.31100000000004, "r_x2": 545.115, "r_y2": 261.759, "r_x3": 371.706, "r_y3": 261.759, "coord_origin": "TOPLEFT"}, "text": "ResNet by default downsamples the image", "orig": "ResNet by default downsamples the image", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 135, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 282.266, "r_x1": 545.115, "r_y1": 282.266, "r_x2": 545.115, "r_y2": 273.71400000000006, "r_x3": 308.862, "r_y3": 273.71400000000006, "coord_origin": "TOPLEFT"}, "text": "resolution by 32 and then the encoded image is provided to", "orig": "resolution by 32 and then the encoded image is provided to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 136, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 294.221, "r_x1": 341.24, "r_y1": 294.221, "r_x2": 341.24, "r_y2": 285.669, "r_x3": 308.862, "r_y3": 285.669, "coord_origin": "TOPLEFT"}, "text": "both the", "orig": "both the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 137, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 343.731, "r_y0": 294.078, "r_x1": 417.235, "r_y1": 294.078, "r_x2": 417.235, "r_y2": 285.49, "r_x3": 343.731, "r_y3": 285.49, "coord_origin": "TOPLEFT"}, "text": "Structure Decoder", "orig": "Structure Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 138, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 417.234, "r_y0": 294.221, "r_x1": 436.601, "r_y1": 294.221, "r_x2": 436.601, "r_y2": 285.669, "r_x3": 417.234, "r_y3": 285.669, "coord_origin": "TOPLEFT"}, "text": ", and", "orig": ", and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 139, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 439.092, "r_y0": 294.078, "r_x1": 516.561, "r_y1": 294.078, "r_x2": 516.561, "r_y2": 285.49, "r_x3": 439.092, "r_y3": 285.49, "coord_origin": "TOPLEFT"}, "text": "Cell BBox Decoder", "orig": "Cell BBox Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 140, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 516.561, "r_y0": 294.221, "r_x1": 519.052, "r_y1": 294.221, "r_x2": 519.052, "r_y2": 285.669, "r_x3": 516.561, "r_y3": 285.669, "coord_origin": "TOPLEFT"}, "text": ".", "orig": ".", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 141, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 306.296, "r_x1": 400.866, "r_y1": 306.296, "r_x2": 400.866, "r_y2": 297.34, "r_x3": 320.817, "r_y3": 297.34, "coord_origin": "TOPLEFT"}, "text": "Structure Decoder.", "orig": "Structure Decoder.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 142, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 403.914, "r_y0": 306.28, "r_x1": 545.114, "r_y1": 306.28, "r_x2": 545.114, "r_y2": 297.728, "r_x3": 403.914, "r_y3": 297.728, "coord_origin": "TOPLEFT"}, "text": "The transformer architecture of this", "orig": "The transformer architecture of this", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 143, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 318.235, "r_x1": 517.529, "r_y1": 318.235, "r_x2": 517.529, "r_y2": 309.683, "r_x3": 308.862, "r_y3": 309.683, "coord_origin": "TOPLEFT"}, "text": "component is based on the work proposed in [31].", "orig": "component is based on the work proposed in [31].", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 144, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 524.094, "r_y0": 318.235, "r_x1": 545.115, "r_y1": 318.235, "r_x2": 545.115, "r_y2": 309.683, "r_x3": 524.094, "r_y3": 309.683, "coord_origin": "TOPLEFT"}, "text": "After", "orig": "After", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 145, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 330.19, "r_x1": 432.358, "r_y1": 330.19, "r_x2": 432.358, "r_y2": 321.638, "r_x3": 308.862, "r_y3": 321.638, "coord_origin": "TOPLEFT"}, "text": "extensive experimentation, the", "orig": "extensive experimentation, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 146, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 435.82, "r_y0": 330.047, "r_x1": 510.29, "r_y1": 330.047, "r_x2": 510.29, "r_y2": 321.459, "r_x3": 435.82, "r_y3": 321.459, "coord_origin": "TOPLEFT"}, "text": "Structure Decoder", "orig": "Structure Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 147, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 513.978, "r_y0": 330.19, "r_x1": 520.623, "r_y1": 330.19, "r_x2": 520.623, "r_y2": 321.638, "r_x3": 513.978, "r_y3": 321.638, "coord_origin": "TOPLEFT"}, "text": "is", "orig": "is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 148, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 524.08, "r_y0": 330.19, "r_x1": 545.111, "r_y1": 330.19, "r_x2": 545.111, "r_y2": 321.638, "r_x3": 524.08, "r_y3": 321.638, "coord_origin": "TOPLEFT"}, "text": "mod-", "orig": "mod-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 149, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 342.145, "r_x1": 545.115, "r_y1": 342.145, "r_x2": 545.115, "r_y2": 333.593, "r_x3": 308.862, "r_y3": 333.593, "coord_origin": "TOPLEFT"}, "text": "eled as a transformer encoder with two encoder layers and", "orig": "eled as a transformer encoder with two encoder layers and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 150, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 354.1, "r_x1": 545.115, "r_y1": 354.1, "r_x2": 545.115, "r_y2": 345.548, "r_x3": 308.862, "r_y3": 345.548, "coord_origin": "TOPLEFT"}, "text": "a transformer decoder made from a stack of 4 decoder lay-", "orig": "a transformer decoder made from a stack of 4 decoder lay-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 151, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 366.056, "r_x1": 545.115, "r_y1": 366.056, "r_x2": 545.115, "r_y2": 357.504, "r_x3": 308.862, "r_y3": 357.504, "coord_origin": "TOPLEFT"}, "text": "ers that comprise mainly of multi-head attention and feed", "orig": "ers that comprise mainly of multi-head attention and feed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 152, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 378.011, "r_x1": 370.391, "r_y1": 378.011, "r_x2": 370.391, "r_y2": 369.459, "r_x3": 308.862, "r_y3": 369.459, "coord_origin": "TOPLEFT"}, "text": "forward layers.", "orig": "forward layers.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 153, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 377.445, "r_y0": 378.011, "r_x1": 545.115, "r_y1": 378.011, "r_x2": 545.115, "r_y2": 369.459, "r_x3": 377.445, "r_y3": 369.459, "coord_origin": "TOPLEFT"}, "text": "This configuration uses fewer layers and", "orig": "This configuration uses fewer layers and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 154, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 389.966, "r_x1": 545.115, "r_y1": 389.966, "r_x2": 545.115, "r_y2": 381.414, "r_x3": 308.862, "r_y3": 381.414, "coord_origin": "TOPLEFT"}, "text": "heads in comparison to networks applied to other problems", "orig": "heads in comparison to networks applied to other problems", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 155, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 401.921, "r_x1": 326.566, "r_y1": 401.921, "r_x2": 326.566, "r_y2": 393.369, "r_x3": 308.862, "r_y3": 393.369, "coord_origin": "TOPLEFT"}, "text": "(e.g.", "orig": "(e.g.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 156, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 331.069, "r_y0": 401.921, "r_x1": 545.115, "r_y1": 401.921, "r_x2": 545.115, "r_y2": 393.369, "r_x3": 331.069, "r_y3": 393.369, "coord_origin": "TOPLEFT"}, "text": "'Scene Understanding', 'Image Captioning'), some-", "orig": "'Scene Understanding', 'Image Captioning'), some-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 157, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 413.876, "r_x1": 528.019, "r_y1": 413.876, "r_x2": 528.019, "r_y2": 405.324, "r_x3": 308.862, "r_y3": 405.324, "coord_origin": "TOPLEFT"}, "text": "thing which we relate to the simplicity of table images.", "orig": "thing which we relate to the simplicity of table images.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 158, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 425.935, "r_x1": 336.309, "r_y1": 425.935, "r_x2": 336.309, "r_y2": 417.383, "r_x3": 320.817, "r_y3": 417.383, "coord_origin": "TOPLEFT"}, "text": "The", "orig": "The", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 159, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 341.579, "r_y0": 425.935, "r_x1": 388.055, "r_y1": 425.935, "r_x2": 388.055, "r_y2": 417.383, "r_x3": 341.579, "r_y3": 417.383, "coord_origin": "TOPLEFT"}, "text": "transformer", "orig": "transformer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 160, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 393.325, "r_y0": 425.935, "r_x1": 424.856, "r_y1": 425.935, "r_x2": 424.856, "r_y2": 417.383, "r_x3": 393.325, "r_y3": 417.383, "coord_origin": "TOPLEFT"}, "text": "encoder", "orig": "encoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 161, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 430.117, "r_y0": 425.935, "r_x1": 462.356, "r_y1": 425.935, "r_x2": 462.356, "r_y2": 417.383, "r_x3": 430.117, "r_y3": 417.383, "coord_origin": "TOPLEFT"}, "text": "receives", "orig": "receives", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 162, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 467.626, "r_y0": 425.935, "r_x1": 477.031, "r_y1": 425.935, "r_x2": 477.031, "r_y2": 417.383, "r_x3": 467.626, "r_y3": 417.383, "coord_origin": "TOPLEFT"}, "text": "an", "orig": "an", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 163, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 482.301, "r_y0": 425.935, "r_x1": 515.496, "r_y1": 425.935, "r_x2": 515.496, "r_y2": 417.383, "r_x3": 482.301, "r_y3": 417.383, "coord_origin": "TOPLEFT"}, "text": "encoded", "orig": "encoded", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 164, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 520.766, "r_y0": 425.935, "r_x1": 545.115, "r_y1": 425.935, "r_x2": 545.115, "r_y2": 417.383, "r_x3": 520.766, "r_y3": 417.383, "coord_origin": "TOPLEFT"}, "text": "image", "orig": "image", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 165, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 437.89, "r_x1": 343.721, "r_y1": 437.89, "r_x2": 343.721, "r_y2": 429.338, "r_x3": 308.862, "r_y3": 429.338, "coord_origin": "TOPLEFT"}, "text": "from the", "orig": "from the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 166, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 347.038, "r_y0": 437.747, "r_x1": 446.455, "r_y1": 437.747, "r_x2": 446.455, "r_y2": 429.159, "r_x3": 347.038, "r_y3": 429.159, "coord_origin": "TOPLEFT"}, "text": "CNN Backbone Network", "orig": "CNN Backbone Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 167, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 449.94, "r_y0": 437.89, "r_x1": 545.113, "r_y1": 437.89, "r_x2": 545.113, "r_y2": 429.338, "r_x3": 449.94, "r_y3": 429.338, "coord_origin": "TOPLEFT"}, "text": "and refines it through a", "orig": "and refines it through a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 168, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 449.845, "r_x1": 545.115, "r_y1": 449.845, "r_x2": 545.115, "r_y2": 441.293, "r_x3": 308.862, "r_y3": 441.293, "coord_origin": "TOPLEFT"}, "text": "multi-head dot-product attention layer, followed by a Feed", "orig": "multi-head dot-product attention layer, followed by a Feed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 169, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 461.8, "r_x1": 384.149, "r_y1": 461.8, "r_x2": 384.149, "r_y2": 453.248, "r_x3": 308.862, "r_y3": 453.248, "coord_origin": "TOPLEFT"}, "text": "Forward Network.", "orig": "Forward Network.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 170, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 393.375, "r_y0": 461.8, "r_x1": 459.616, "r_y1": 461.8, "r_x2": 459.616, "r_y2": 453.248, "r_x3": 393.375, "r_y3": 453.248, "coord_origin": "TOPLEFT"}, "text": "During training,", "orig": "During training,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 171, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 464.667, "r_y0": 461.8, "r_x1": 476.841, "r_y1": 461.8, "r_x2": 476.841, "r_y2": 453.248, "r_x3": 464.667, "r_y3": 453.248, "coord_origin": "TOPLEFT"}, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 172, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 481.374, "r_y0": 461.8, "r_x1": 527.85, "r_y1": 461.8, "r_x2": 527.85, "r_y2": 453.248, "r_x3": 481.374, "r_y3": 453.248, "coord_origin": "TOPLEFT"}, "text": "transformer", "orig": "transformer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 173, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 532.393, "r_y0": 461.8, "r_x1": 545.115, "r_y1": 461.8, "r_x2": 545.115, "r_y2": 453.248, "r_x3": 532.393, "r_y3": 453.248, "coord_origin": "TOPLEFT"}, "text": "de-", "orig": "de-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 174, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 473.756, "r_x1": 545.115, "r_y1": 473.756, "r_x2": 545.115, "r_y2": 465.204, "r_x3": 308.862, "r_y3": 465.204, "coord_origin": "TOPLEFT"}, "text": "coder receives as input the output feature produced by the", "orig": "coder receives as input the output feature produced by the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 175, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 485.711, "r_x1": 545.115, "r_y1": 485.711, "r_x2": 545.115, "r_y2": 477.159, "r_x3": 308.862, "r_y3": 477.159, "coord_origin": "TOPLEFT"}, "text": "transformer encoder, and the tokenized input of the HTML", "orig": "transformer encoder, and the tokenized input of the HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 176, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 497.666, "r_x1": 545.115, "r_y1": 497.666, "r_x2": 545.115, "r_y2": 489.114, "r_x3": 308.862, "r_y3": 489.114, "coord_origin": "TOPLEFT"}, "text": "ground-truth tags. Using a stack of multi-head attention lay-", "orig": "ground-truth tags. Using a stack of multi-head attention lay-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 177, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 509.621, "r_x1": 545.115, "r_y1": 509.621, "r_x2": 545.115, "r_y2": 501.069, "r_x3": 308.862, "r_y3": 501.069, "coord_origin": "TOPLEFT"}, "text": "ers, different aspects of the tag sequence could be inferred.", "orig": "ers, different aspects of the tag sequence could be inferred.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 178, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 521.576, "r_x1": 545.115, "r_y1": 521.576, "r_x2": 545.115, "r_y2": 513.024, "r_x3": 308.862, "r_y3": 513.024, "coord_origin": "TOPLEFT"}, "text": "This is achieved by each attention head on a layer operating", "orig": "This is achieved by each attention head on a layer operating", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 179, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 533.5319999999999, "r_x1": 545.115, "r_y1": 533.5319999999999, "r_x2": 545.115, "r_y2": 524.98, "r_x3": 308.862, "r_y3": 524.98, "coord_origin": "TOPLEFT"}, "text": "in a different subspace, and then combining altogether their", "orig": "in a different subspace, and then combining altogether their", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 180, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 545.487, "r_x1": 369.733, "r_y1": 545.487, "r_x2": 369.733, "r_y2": 536.935, "r_x3": 308.862, "r_y3": 536.935, "coord_origin": "TOPLEFT"}, "text": "attention score.", "orig": "attention score.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 181, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 557.561, "r_x1": 404.762, "r_y1": 557.561, "r_x2": 404.762, "r_y2": 548.605, "r_x3": 320.817, "r_y3": 548.605, "coord_origin": "TOPLEFT"}, "text": "Cell BBox Decoder.", "orig": "Cell BBox Decoder.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 182, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 410.341, "r_y0": 557.545, "r_x1": 545.115, "r_y1": 557.545, "r_x2": 545.115, "r_y2": 548.9929999999999, "r_x3": 410.341, "r_y3": 548.9929999999999, "coord_origin": "TOPLEFT"}, "text": "Our architecture allows to simul-", "orig": "Our architecture allows to simul-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 183, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 569.501, "r_x1": 545.115, "r_y1": 569.501, "r_x2": 545.115, "r_y2": 560.9490000000001, "r_x3": 308.862, "r_y3": 560.9490000000001, "coord_origin": "TOPLEFT"}, "text": "taneously predict HTML tags and bounding boxes for each", "orig": "taneously predict HTML tags and bounding boxes for each", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 184, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 581.456, "r_x1": 545.115, "r_y1": 581.456, "r_x2": 545.115, "r_y2": 572.904, "r_x3": 308.862, "r_y3": 572.904, "coord_origin": "TOPLEFT"}, "text": "table cell without the need of a separate object detector end", "orig": "table cell without the need of a separate object detector end", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 185, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 593.4110000000001, "r_x1": 336.458, "r_y1": 593.4110000000001, "r_x2": 336.458, "r_y2": 584.859, "r_x3": 308.862, "r_y3": 584.859, "coord_origin": "TOPLEFT"}, "text": "to end.", "orig": "to end.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 186, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 340.971, "r_y0": 593.4110000000001, "r_x1": 545.115, "r_y1": 593.4110000000001, "r_x2": 545.115, "r_y2": 584.859, "r_x3": 340.971, "r_y3": 584.859, "coord_origin": "TOPLEFT"}, "text": "This approach is inspired by DETR [1] which em-", "orig": "This approach is inspired by DETR [1] which em-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 187, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 605.366, "r_x1": 545.115, "r_y1": 605.366, "r_x2": 545.115, "r_y2": 596.814, "r_x3": 308.862, "r_y3": 596.814, "coord_origin": "TOPLEFT"}, "text": "ploys a Transformer Encoder, and Decoder that looks for", "orig": "ploys a Transformer Encoder, and Decoder that looks for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 188, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 617.321, "r_x1": 545.115, "r_y1": 617.321, "r_x2": 545.115, "r_y2": 608.769, "r_x3": 308.862, "r_y3": 608.769, "coord_origin": "TOPLEFT"}, "text": "a specific number of object queries (potential object detec-", "orig": "a specific number of object queries (potential object detec-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 189, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 629.2760000000001, "r_x1": 545.115, "r_y1": 629.2760000000001, "r_x2": 545.115, "r_y2": 620.7239999999999, "r_x3": 308.862, "r_y3": 620.7239999999999, "coord_origin": "TOPLEFT"}, "text": "tions). As our model utilizes a transformer architecture, the", "orig": "tions). As our model utilizes a transformer architecture, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 190, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 641.232, "r_x1": 381.679, "r_y1": 641.232, "r_x2": 381.679, "r_y2": 632.6800000000001, "r_x3": 308.862, "r_y3": 632.6800000000001, "coord_origin": "TOPLEFT"}, "text": "hidden state of the", "orig": "hidden state of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 191, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 383.997, "r_y0": 641.068, "r_x1": 391.746, "r_y1": 641.068, "r_x2": 391.746, "r_y2": 632.362, "r_x3": 383.997, "r_y3": 632.362, "coord_origin": "TOPLEFT"}, "text": "<", "orig": "<", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 192, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 391.746, "r_y0": 641.232, "r_x1": 399.497, "r_y1": 641.232, "r_x2": 399.497, "r_y2": 632.6800000000001, "r_x3": 391.746, "r_y3": 632.6800000000001, "coord_origin": "TOPLEFT"}, "text": "td", "orig": "td", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 193, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 399.497, "r_y0": 641.068, "r_x1": 407.246, "r_y1": 641.068, "r_x2": 407.246, "r_y2": 632.362, "r_x3": 399.497, "r_y3": 632.362, "coord_origin": "TOPLEFT"}, "text": ">", "orig": ">", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 194, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 407.246, "r_y0": 641.232, "r_x1": 432.91, "r_y1": 641.232, "r_x2": 432.91, "r_y2": 632.6800000000001, "r_x3": 407.246, "r_y3": 632.6800000000001, "coord_origin": "TOPLEFT"}, "text": "' and '", "orig": "' and '", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 195, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 432.908, "r_y0": 641.068, "r_x1": 440.657, "r_y1": 641.068, "r_x2": 440.657, "r_y2": 632.362, "r_x3": 432.908, "r_y3": 632.362, "coord_origin": "TOPLEFT"}, "text": "<", "orig": "<", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 196, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 440.657, "r_y0": 641.232, "r_x1": 545.115, "r_y1": 641.232, "r_x2": 545.115, "r_y2": 632.6800000000001, "r_x3": 440.657, "r_y3": 632.6800000000001, "coord_origin": "TOPLEFT"}, "text": "' HTMLstructure tags be-", "orig": "' HTMLstructure tags be-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 197, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 653.187, "r_x1": 398.964, "r_y1": 653.187, "r_x2": 398.964, "r_y2": 644.635, "r_x3": 308.862, "r_y3": 644.635, "coord_origin": "TOPLEFT"}, "text": "come the object query.", "orig": "come the object query.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 198, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 665.246, "r_x1": 444.343, "r_y1": 665.246, "r_x2": 444.343, "r_y2": 656.694, "r_x3": 320.817, "r_y3": 656.694, "coord_origin": "TOPLEFT"}, "text": "The encoding generated by the", "orig": "The encoding generated by the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 199, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 447.006, "r_y0": 665.103, "r_x1": 545.108, "r_y1": 665.103, "r_x2": 545.108, "r_y2": 656.515, "r_x3": 447.006, "r_y3": 656.515, "coord_origin": "TOPLEFT"}, "text": "CNN Backbone Network", "orig": "CNN Backbone Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 200, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 677.201, "r_x1": 545.115, "r_y1": 677.201, "r_x2": 545.115, "r_y2": 668.649, "r_x3": 308.862, "r_y3": 668.649, "coord_origin": "TOPLEFT"}, "text": "along with the features acquired for every data cell from the", "orig": "along with the features acquired for every data cell from the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 201, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 689.156, "r_x1": 545.115, "r_y1": 689.156, "r_x2": 545.115, "r_y2": 680.604, "r_x3": 308.862, "r_y3": 680.604, "coord_origin": "TOPLEFT"}, "text": "Transformer Decoder are then passed to the attention net-", "orig": "Transformer Decoder are then passed to the attention net-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 202, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 701.111, "r_x1": 545.115, "r_y1": 701.111, "r_x2": 545.115, "r_y2": 692.559, "r_x3": 308.862, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "work. The attention network takes both inputs and learns to", "orig": "work. The attention network takes both inputs and learns to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 203, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 713.066, "r_x1": 470.425, "r_y1": 713.066, "r_x2": 470.425, "r_y2": 704.514, "r_x3": 308.862, "r_y3": 704.514, "coord_origin": "TOPLEFT"}, "text": "provide an attention weighted encoding.", "orig": "provide an attention weighted encoding.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 204, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 474.63, "r_y0": 713.066, "r_x1": 545.115, "r_y1": 713.066, "r_x2": 545.115, "r_y2": 704.514, "r_x3": 474.63, "r_y3": 704.514, "coord_origin": "TOPLEFT"}, "text": "This weighted at-", "orig": "This weighted at-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 205, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 295.121, "r_y0": 742.954, "r_x1": 300.102, "r_y1": 742.954, "r_x2": 300.102, "r_y2": 734.402, "r_x3": 295.121, "r_y3": 734.402, "coord_origin": "TOPLEFT"}, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "parsed_page": null, "predictions": {"layout": {"clusters": [{"id": 7, "label": "picture", "bbox": {"l": 74.30525970458984, "t": 77.91120147705078, "r": 519.9801025390625, "b": 183.70150756835938, "coord_origin": "TOPLEFT"}, "confidence": 0.9296807646751404, "cells": [{"index": 0, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 81.688, "r_y0": 125.61699999999996, "r_x1": 84.524, "r_y1": 125.61699999999996, "r_x2": 84.524, "r_y2": 122.481, "r_x3": 81.688, "r_y3": 122.481, "coord_origin": "TOPLEFT"}, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 86.413, "r_y0": 125.61699999999996, "r_x1": 93.026, "r_y1": 125.61699999999996, "r_x2": 93.026, "r_y2": 122.481, "r_x3": 86.413, "r_y3": 122.481, "coord_origin": "TOPLEFT"}, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 102.505, "r_y0": 118.42999999999995, "r_x1": 115.346, "r_y1": 118.42999999999995, "r_x2": 115.346, "r_y2": 115.293, "r_x3": 102.505, "r_y3": 115.293, "coord_origin": "TOPLEFT"}, "text": "Amount", "orig": "Amount", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 82.14, "r_y0": 118.39200000000005, "r_x1": 93.292, "r_y1": 118.39200000000005, "r_x2": 93.292, "r_y2": 115.25599999999997, "r_x3": 82.14, "r_y3": 115.25599999999997, "coord_origin": "TOPLEFT"}, "text": "Names", "orig": "Names", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 96.748, "r_y0": 125.61699999999996, "r_x1": 104.312, "r_y1": 125.61699999999996, "r_x2": 104.312, "r_y2": 122.481, "r_x3": 96.748, "r_y3": 122.481, "coord_origin": "TOPLEFT"}, "text": "1000", "orig": "1000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 96.748, "r_y0": 130.92100000000005, "r_x1": 102.421, "r_y1": 130.92100000000005, "r_x2": 102.421, "r_y2": 127.78499999999997, "r_x3": 96.748, "r_y3": 127.78499999999997, "coord_origin": "TOPLEFT"}, "text": "500", "orig": "500", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 96.748, "r_y0": 136.63300000000004, "r_x1": 104.312, "r_y1": 136.63300000000004, "r_x2": 104.312, "r_y2": 133.49699999999996, "r_x3": 96.748, "r_y3": 133.49699999999996, "coord_origin": "TOPLEFT"}, "text": "3500", "orig": "3500", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 96.748, "r_y0": 142.34500000000003, "r_x1": 102.421, "r_y1": 142.34500000000003, "r_x2": 102.421, "r_y2": 139.20899999999995, "r_x3": 96.748, "r_y3": 139.20899999999995, "coord_origin": "TOPLEFT"}, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 110.661, "r_y0": 125.61699999999996, "r_x1": 116.144, "r_y1": 125.61699999999996, "r_x2": 116.144, "r_y2": 122.481, "r_x3": 110.661, "r_y3": 122.481, "coord_origin": "TOPLEFT"}, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 110.661, "r_y0": 130.92100000000005, "r_x1": 116.144, "r_y1": 130.92100000000005, "r_x2": 116.144, "r_y2": 127.78499999999997, "r_x3": 110.661, "r_y3": 127.78499999999997, "coord_origin": "TOPLEFT"}, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 110.661, "r_y0": 136.63300000000004, "r_x1": 116.144, "r_y1": 136.63300000000004, "r_x2": 116.144, "r_y2": 133.49699999999996, "r_x3": 110.661, "r_y3": 133.49699999999996, "coord_origin": "TOPLEFT"}, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 110.661, "r_y0": 142.34500000000003, "r_x1": 116.144, "r_y1": 142.34500000000003, "r_x2": 116.144, "r_y2": 139.20899999999995, "r_x3": 110.661, "r_y3": 139.20899999999995, "coord_origin": "TOPLEFT"}, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 81.688, "r_y0": 130.92100000000005, "r_x1": 84.524, "r_y1": 130.92100000000005, "r_x2": 84.524, "r_y2": 127.78499999999997, "r_x3": 81.688, "r_y3": 127.78499999999997, "coord_origin": "TOPLEFT"}, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 86.413, "r_y0": 130.92100000000005, "r_x1": 93.026, "r_y1": 130.92100000000005, "r_x2": 93.026, "r_y2": 127.78499999999997, "r_x3": 86.413, "r_y3": 127.78499999999997, "coord_origin": "TOPLEFT"}, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 81.688, "r_y0": 136.63300000000004, "r_x1": 84.524, "r_y1": 136.63300000000004, "r_x2": 84.524, "r_y2": 133.49699999999996, "r_x3": 81.688, "r_y3": 133.49699999999996, "coord_origin": "TOPLEFT"}, "text": "3.", "orig": "3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 86.413, "r_y0": 136.63300000000004, "r_x1": 93.026, "r_y1": 136.63300000000004, "r_x2": 93.026, "r_y2": 133.49699999999996, "r_x3": 86.413, "r_y3": 133.49699999999996, "coord_origin": "TOPLEFT"}, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 81.688, "r_y0": 142.34500000000003, "r_x1": 84.524, "r_y1": 142.34500000000003, "r_x2": 84.524, "r_y2": 139.20899999999995, "r_x3": 81.688, "r_y3": 139.20899999999995, "coord_origin": "TOPLEFT"}, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 86.413, "r_y0": 142.34500000000003, "r_x1": 93.026, "r_y1": 142.34500000000003, "r_x2": 93.026, "r_y2": 139.20899999999995, "r_x3": 86.413, "r_y3": 139.20899999999995, "coord_origin": "TOPLEFT"}, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 88.084, "r_y0": 96.21699999999998, "r_x1": 113.936, "r_y1": 96.21699999999998, "r_x2": 113.936, "r_y2": 90.57100000000003, "r_x3": 88.084, "r_y3": 90.57100000000003, "coord_origin": "TOPLEFT"}, "text": "Extracted", "orig": "Extracted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 19, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 82.81, "r_y0": 103.35699999999997, "r_x1": 119.212, "r_y1": 103.35699999999997, "r_x2": 119.212, "r_y2": 97.71100000000001, "r_x3": 82.81, "r_y3": 97.71100000000001, "coord_origin": "TOPLEFT"}, "text": "Table Images", "orig": "Table Images", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 20, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 143.942, "r_y0": 106.322, "r_x1": 180.011, "r_y1": 106.322, "r_x2": 180.011, "r_y2": 100.67600000000004, "r_x3": 143.942, "r_y3": 100.67600000000004, "coord_origin": "TOPLEFT"}, "text": "Standardized", "orig": "Standardized", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 21, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.941, "r_y0": 113.46199999999999, "r_x1": 172.012, "r_y1": 113.46199999999999, "r_x2": 172.012, "r_y2": 107.81600000000003, "r_x3": 151.941, "r_y3": 107.81600000000003, "coord_origin": "TOPLEFT"}, "text": "Images", "orig": "Images", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 22, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 251.769, "r_y0": 86.64999999999998, "r_x1": 266.396, "r_y1": 86.64999999999998, "r_x2": 266.396, "r_y2": 81.00400000000002, "r_x3": 251.769, "r_y3": 81.00400000000002, "coord_origin": "TOPLEFT"}, "text": "BBox", "orig": "BBox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 23, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 247.516, "r_y0": 91.75, "r_x1": 270.65, "r_y1": 91.75, "r_x2": 270.65, "r_y2": 86.10400000000004, "r_x3": 247.516, "r_y3": 86.10400000000004, "coord_origin": "TOPLEFT"}, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 24, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 331.037, "r_y0": 84.279, "r_x1": 352.126, "r_y1": 84.279, "r_x2": 352.126, "r_y2": 78.63300000000004, "r_x3": 331.037, "r_y3": 78.63300000000004, "coord_origin": "TOPLEFT"}, "text": "BBoxes", "orig": "BBoxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 25, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 390.564, "r_y0": 101.75199999999995, "r_x1": 431.726, "r_y1": 101.75199999999995, "r_x2": 431.726, "r_y2": 96.106, "r_x3": 390.564, "r_y3": 96.106, "coord_origin": "TOPLEFT"}, "text": "BBoxes can be", "orig": "BBoxes can be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 26, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 386.824, "r_y0": 107.87199999999996, "r_x1": 435.47, "r_y1": 107.87199999999996, "r_x2": 435.47, "r_y2": 102.226, "r_x3": 386.824, "r_y3": 102.226, "coord_origin": "TOPLEFT"}, "text": "traced back to the", "orig": "traced back to the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 27, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 388.696, "r_y0": 113.99199999999996, "r_x1": 433.603, "r_y1": 113.99199999999996, "r_x2": 433.603, "r_y2": 108.346, "r_x3": 388.696, "r_y3": 108.346, "coord_origin": "TOPLEFT"}, "text": "original image to", "orig": "original image to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 28, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 391.078, "r_y0": 120.11199999999997, "r_x1": 431.225, "r_y1": 120.11199999999997, "r_x2": 431.225, "r_y2": 114.46600000000001, "r_x3": 391.078, "r_y3": 114.46600000000001, "coord_origin": "TOPLEFT"}, "text": "extract content", "orig": "extract content", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 29, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 431.227, "r_y0": 157.40499999999997, "r_x1": 498.821, "r_y1": 157.40499999999997, "r_x2": 498.821, "r_y2": 151.75900000000001, "r_x3": 431.227, "r_y3": 151.75900000000001, "coord_origin": "TOPLEFT"}, "text": "Structure Tags sequence", "orig": "Structure Tags sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 30, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 431.174, "r_y0": 163.52499999999998, "r_x1": 498.878, "r_y1": 163.52499999999998, "r_x2": 498.878, "r_y2": 157.87900000000002, "r_x3": 431.174, "r_y3": 157.87900000000002, "coord_origin": "TOPLEFT"}, "text": "provide full description of", "orig": "provide full description of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 440.529, "r_y0": 169.64499999999998, "r_x1": 489.518, "r_y1": 169.64499999999998, "r_x2": 489.518, "r_y2": 163.99900000000002, "r_x3": 440.529, "r_y3": 163.99900000000002, "coord_origin": "TOPLEFT"}, "text": "the table structure", "orig": "the table structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.375, "r_y0": 183.97299999999996, "r_x1": 367.723, "r_y1": 183.97299999999996, "r_x2": 367.723, "r_y2": 178.327, "r_x3": 328.375, "r_y3": 178.327, "coord_origin": "TOPLEFT"}, "text": "Structure Tags", "orig": "Structure Tags", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 331.845, "r_y0": 129.62800000000004, "r_x1": 373.68, "r_y1": 129.62800000000004, "r_x2": 373.68, "r_y2": 123.98199999999997, "r_x3": 331.845, "r_y3": 123.98199999999997, "coord_origin": "TOPLEFT"}, "text": "BBoxes in sync", "orig": "BBoxes in sync", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 331.845, "r_y0": 134.72799999999995, "r_x1": 381.178, "r_y1": 134.72799999999995, "r_x2": 381.178, "r_y2": 129.082, "r_x3": 331.845, "r_y3": 129.082, "coord_origin": "TOPLEFT"}, "text": "with tag sequence", "orig": "with tag sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 196.626, "r_y0": 93.83600000000001, "r_x1": 219.423, "r_y1": 93.83600000000001, "r_x2": 219.423, "r_y2": 88.19000000000005, "r_x3": 196.626, "r_y3": 88.19000000000005, "coord_origin": "TOPLEFT"}, "text": "Encoder", "orig": "Encoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 246.668, "r_y0": 135.21400000000006, "r_x1": 271.499, "r_y1": 135.21400000000006, "r_x2": 271.499, "r_y2": 129.56799999999998, "r_x3": 246.668, "r_y3": 129.56799999999998, "coord_origin": "TOPLEFT"}, "text": "Structure", "orig": "Structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 247.516, "r_y0": 140.31399999999996, "r_x1": 270.65, "r_y1": 140.31399999999996, "r_x2": 270.65, "r_y2": 134.668, "r_x3": 247.516, "r_y3": 134.668, "coord_origin": "TOPLEFT"}, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 330.631, "r_y0": 94.73900000000003, "r_x1": 365.553, "r_y1": 94.73900000000003, "r_x2": 365.553, "r_y2": 89.09299999999996, "r_x3": 330.631, "r_y3": 89.09299999999996, "coord_origin": "TOPLEFT"}, "text": "[x1, y2, x2, y2]", "orig": "[x1, y2, x2, y2]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 330.631, "r_y0": 102.899, "r_x1": 370.227, "r_y1": 102.899, "r_x2": 370.227, "r_y2": 97.25300000000004, "r_x3": 330.631, "r_y3": 97.25300000000004, "coord_origin": "TOPLEFT"}, "text": "[x1', y2', x2', y2']", "orig": "[x1', y2', x2', y2']", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 330.631, "r_y0": 111.05899999999997, "r_x1": 374.512, "r_y1": 111.05899999999997, "r_x2": 374.512, "r_y2": 105.41300000000001, "r_x3": 330.631, "r_y3": 105.41300000000001, "coord_origin": "TOPLEFT"}, "text": "[x1'', y2'', x2'', y2'']", "orig": "[x1'', y2'', x2'', y2'']", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 330.631, "r_y0": 119.21900000000005, "r_x1": 335.732, "r_y1": 119.21900000000005, "r_x2": 335.732, "r_y2": 113.57299999999998, "r_x3": 330.631, "r_y3": 113.57299999999998, "coord_origin": "TOPLEFT"}, "text": "...", "orig": "...", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 322.306, "r_y0": 146.558, "r_x1": 335.06, "r_y1": 146.558, "r_x2": 335.06, "r_y2": 141.85400000000004, "r_x3": 322.306, "r_y3": 141.85400000000004, "coord_origin": "TOPLEFT"}, "text": "<TR>", "orig": "<TR>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 322.306, "r_y0": 153.69799999999998, "r_x1": 421.588, "r_y1": 153.69799999999998, "r_x2": 421.588, "r_y2": 148.99400000000003, "r_x3": 322.306, "r_y3": 148.99400000000003, "coord_origin": "TOPLEFT"}, "text": "<TD> 1 </TD><TD colspan=\"2\"> 2 </TD>", "orig": "<TD> 1 </TD><TD colspan=\"2\"> 2 </TD>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 322.306, "r_y0": 160.83799999999997, "r_x1": 349.23, "r_y1": 160.83799999999997, "r_x2": 349.23, "r_y2": 156.13400000000001, "r_x3": 322.306, "r_y3": 156.13400000000001, "coord_origin": "TOPLEFT"}, "text": "</TR><TR>", "orig": "</TR><TR>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 322.306, "r_y0": 167.97799999999995, "r_x1": 374.737, "r_y1": 167.97799999999995, "r_x2": 374.737, "r_y2": 163.274, "r_x3": 322.306, "r_y3": 163.274, "coord_origin": "TOPLEFT"}, "text": "<TD> 3 </TD><TD>...", "orig": "<TD> 3 </TD><TD>...", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 322.306, "r_y0": 175.11800000000005, "r_x1": 326.557, "r_y1": 175.11800000000005, "r_x2": 326.557, "r_y2": 170.414, "r_x3": 322.306, "r_y3": 170.414, "coord_origin": "TOPLEFT"}, "text": "...", "orig": "...", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 323.511, "r_y0": 95.38900000000001, "r_x1": 326.914, "r_y1": 95.38900000000001, "r_x2": 326.914, "r_y2": 89.74300000000005, "r_x3": 323.511, "r_y3": 89.74300000000005, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 48, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 323.715, "r_y0": 103.50800000000004, "r_x1": 327.118, "r_y1": 103.50800000000004, "r_x2": 327.118, "r_y2": 97.86199999999997, "r_x3": 323.715, "r_y3": 97.86199999999997, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 49, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 323.715, "r_y0": 111.70899999999995, "r_x1": 327.118, "r_y1": 111.70899999999995, "r_x2": 327.118, "r_y2": 106.06299999999999, "r_x3": 323.715, "r_y3": 106.06299999999999, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 50, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 454.464, "r_y0": 110.26499999999999, "r_x1": 457.867, "r_y1": 110.26499999999999, "r_x2": 457.867, "r_y2": 104.61900000000003, "r_x3": 454.464, "r_y3": 104.61900000000003, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 51, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 493.326, "r_y0": 96.81500000000005, "r_x1": 496.729, "r_y1": 96.81500000000005, "r_x2": 496.729, "r_y2": 91.16899999999998, "r_x3": 493.326, "r_y3": 91.16899999999998, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 52, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 454.083, "r_y0": 96.28800000000001, "r_x1": 457.486, "r_y1": 96.28800000000001, "r_x2": 457.486, "r_y2": 90.64200000000005, "r_x3": 454.083, "r_y3": 90.64200000000005, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": [{"id": 11, "label": "text", "bbox": {"l": 81.688, "t": 122.481, "r": 84.524, "b": 125.61699999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 0, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 81.688, "r_y0": 125.61699999999996, "r_x1": 84.524, "r_y1": 125.61699999999996, "r_x2": 84.524, "r_y2": 122.481, "r_x3": 81.688, "r_y3": 122.481, "coord_origin": "TOPLEFT"}, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 12, "label": "text", "bbox": {"l": 86.413, "t": 122.481, "r": 93.026, "b": 125.61699999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 86.413, "r_y0": 125.61699999999996, "r_x1": 93.026, "r_y1": 125.61699999999996, "r_x2": 93.026, "r_y2": 122.481, "r_x3": 86.413, "r_y3": 122.481, "coord_origin": "TOPLEFT"}, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 13, "label": "text", "bbox": {"l": 102.505, "t": 115.293, "r": 115.346, "b": 118.42999999999995, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 102.505, "r_y0": 118.42999999999995, "r_x1": 115.346, "r_y1": 118.42999999999995, "r_x2": 115.346, "r_y2": 115.293, "r_x3": 102.505, "r_y3": 115.293, "coord_origin": "TOPLEFT"}, "text": "Amount", "orig": "Amount", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 14, "label": "text", "bbox": {"l": 82.14, "t": 115.25599999999997, "r": 93.292, "b": 118.39200000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 82.14, "r_y0": 118.39200000000005, "r_x1": 93.292, "r_y1": 118.39200000000005, "r_x2": 93.292, "r_y2": 115.25599999999997, "r_x3": 82.14, "r_y3": 115.25599999999997, "coord_origin": "TOPLEFT"}, "text": "Names", "orig": "Names", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 15, "label": "text", "bbox": {"l": 96.748, "t": 122.481, "r": 104.312, "b": 125.61699999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 96.748, "r_y0": 125.61699999999996, "r_x1": 104.312, "r_y1": 125.61699999999996, "r_x2": 104.312, "r_y2": 122.481, "r_x3": 96.748, "r_y3": 122.481, "coord_origin": "TOPLEFT"}, "text": "1000", "orig": "1000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 16, "label": "text", "bbox": {"l": 96.748, "t": 127.78499999999997, "r": 102.421, "b": 130.92100000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 96.748, "r_y0": 130.92100000000005, "r_x1": 102.421, "r_y1": 130.92100000000005, "r_x2": 102.421, "r_y2": 127.78499999999997, "r_x3": 96.748, "r_y3": 127.78499999999997, "coord_origin": "TOPLEFT"}, "text": "500", "orig": "500", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 17, "label": "text", "bbox": {"l": 96.748, "t": 133.49699999999996, "r": 104.312, "b": 136.63300000000004, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 96.748, "r_y0": 136.63300000000004, "r_x1": 104.312, "r_y1": 136.63300000000004, "r_x2": 104.312, "r_y2": 133.49699999999996, "r_x3": 96.748, "r_y3": 133.49699999999996, "coord_origin": "TOPLEFT"}, "text": "3500", "orig": "3500", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 18, "label": "text", "bbox": {"l": 96.748, "t": 139.20899999999995, "r": 102.421, "b": 142.34500000000003, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 96.748, "r_y0": 142.34500000000003, "r_x1": 102.421, "r_y1": 142.34500000000003, "r_x2": 102.421, "r_y2": 139.20899999999995, "r_x3": 96.748, "r_y3": 139.20899999999995, "coord_origin": "TOPLEFT"}, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 19, "label": "text", "bbox": {"l": 110.661, "t": 122.481, "r": 116.144, "b": 125.61699999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 110.661, "r_y0": 125.61699999999996, "r_x1": 116.144, "r_y1": 125.61699999999996, "r_x2": 116.144, "r_y2": 122.481, "r_x3": 110.661, "r_y3": 122.481, "coord_origin": "TOPLEFT"}, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 20, "label": "text", "bbox": {"l": 110.661, "t": 127.78499999999997, "r": 116.144, "b": 130.92100000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 110.661, "r_y0": 130.92100000000005, "r_x1": 116.144, "r_y1": 130.92100000000005, "r_x2": 116.144, "r_y2": 127.78499999999997, "r_x3": 110.661, "r_y3": 127.78499999999997, "coord_origin": "TOPLEFT"}, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 21, "label": "text", "bbox": {"l": 110.661, "t": 133.49699999999996, "r": 116.144, "b": 136.63300000000004, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 110.661, "r_y0": 136.63300000000004, "r_x1": 116.144, "r_y1": 136.63300000000004, "r_x2": 116.144, "r_y2": 133.49699999999996, "r_x3": 110.661, "r_y3": 133.49699999999996, "coord_origin": "TOPLEFT"}, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 22, "label": "text", "bbox": {"l": 110.661, "t": 139.20899999999995, "r": 116.144, "b": 142.34500000000003, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 110.661, "r_y0": 142.34500000000003, "r_x1": 116.144, "r_y1": 142.34500000000003, "r_x2": 116.144, "r_y2": 139.20899999999995, "r_x3": 110.661, "r_y3": 139.20899999999995, "coord_origin": "TOPLEFT"}, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 23, "label": "text", "bbox": {"l": 81.688, "t": 127.78499999999997, "r": 84.524, "b": 130.92100000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 81.688, "r_y0": 130.92100000000005, "r_x1": 84.524, "r_y1": 130.92100000000005, "r_x2": 84.524, "r_y2": 127.78499999999997, "r_x3": 81.688, "r_y3": 127.78499999999997, "coord_origin": "TOPLEFT"}, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 24, "label": "text", "bbox": {"l": 86.413, "t": 127.78499999999997, "r": 93.026, "b": 130.92100000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 86.413, "r_y0": 130.92100000000005, "r_x1": 93.026, "r_y1": 130.92100000000005, "r_x2": 93.026, "r_y2": 127.78499999999997, "r_x3": 86.413, "r_y3": 127.78499999999997, "coord_origin": "TOPLEFT"}, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 25, "label": "text", "bbox": {"l": 81.688, "t": 133.49699999999996, "r": 84.524, "b": 136.63300000000004, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 81.688, "r_y0": 136.63300000000004, "r_x1": 84.524, "r_y1": 136.63300000000004, "r_x2": 84.524, "r_y2": 133.49699999999996, "r_x3": 81.688, "r_y3": 133.49699999999996, "coord_origin": "TOPLEFT"}, "text": "3.", "orig": "3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 26, "label": "text", "bbox": {"l": 86.413, "t": 133.49699999999996, "r": 93.026, "b": 136.63300000000004, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 86.413, "r_y0": 136.63300000000004, "r_x1": 93.026, "r_y1": 136.63300000000004, "r_x2": 93.026, "r_y2": 133.49699999999996, "r_x3": 86.413, "r_y3": 133.49699999999996, "coord_origin": "TOPLEFT"}, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 27, "label": "text", "bbox": {"l": 81.688, "t": 139.20899999999995, "r": 84.524, "b": 142.34500000000003, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 81.688, "r_y0": 142.34500000000003, "r_x1": 84.524, "r_y1": 142.34500000000003, "r_x2": 84.524, "r_y2": 139.20899999999995, "r_x3": 81.688, "r_y3": 139.20899999999995, "coord_origin": "TOPLEFT"}, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 28, "label": "text", "bbox": {"l": 86.413, "t": 139.20899999999995, "r": 93.026, "b": 142.34500000000003, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 86.413, "r_y0": 142.34500000000003, "r_x1": 93.026, "r_y1": 142.34500000000003, "r_x2": 93.026, "r_y2": 139.20899999999995, "r_x3": 86.413, "r_y3": 139.20899999999995, "coord_origin": "TOPLEFT"}, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 29, "label": "text", "bbox": {"l": 88.084, "t": 90.57100000000003, "r": 113.936, "b": 96.21699999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 88.084, "r_y0": 96.21699999999998, "r_x1": 113.936, "r_y1": 96.21699999999998, "r_x2": 113.936, "r_y2": 90.57100000000003, "r_x3": 88.084, "r_y3": 90.57100000000003, "coord_origin": "TOPLEFT"}, "text": "Extracted", "orig": "Extracted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 30, "label": "text", "bbox": {"l": 82.81, "t": 97.71100000000001, "r": 119.212, "b": 103.35699999999997, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 19, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 82.81, "r_y0": 103.35699999999997, "r_x1": 119.212, "r_y1": 103.35699999999997, "r_x2": 119.212, "r_y2": 97.71100000000001, "r_x3": 82.81, "r_y3": 97.71100000000001, "coord_origin": "TOPLEFT"}, "text": "Table Images", "orig": "Table Images", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 31, "label": "text", "bbox": {"l": 143.942, "t": 100.67600000000004, "r": 180.011, "b": 106.322, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 20, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 143.942, "r_y0": 106.322, "r_x1": 180.011, "r_y1": 106.322, "r_x2": 180.011, "r_y2": 100.67600000000004, "r_x3": 143.942, "r_y3": 100.67600000000004, "coord_origin": "TOPLEFT"}, "text": "Standardized", "orig": "Standardized", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 32, "label": "text", "bbox": {"l": 151.941, "t": 107.81600000000003, "r": 172.012, "b": 113.46199999999999, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 21, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.941, "r_y0": 113.46199999999999, "r_x1": 172.012, "r_y1": 113.46199999999999, "r_x2": 172.012, "r_y2": 107.81600000000003, "r_x3": 151.941, "r_y3": 107.81600000000003, "coord_origin": "TOPLEFT"}, "text": "Images", "orig": "Images", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 33, "label": "text", "bbox": {"l": 251.769, "t": 81.00400000000002, "r": 266.396, "b": 86.64999999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 22, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 251.769, "r_y0": 86.64999999999998, "r_x1": 266.396, "r_y1": 86.64999999999998, "r_x2": 266.396, "r_y2": 81.00400000000002, "r_x3": 251.769, "r_y3": 81.00400000000002, "coord_origin": "TOPLEFT"}, "text": "BBox", "orig": "BBox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 34, "label": "text", "bbox": {"l": 247.516, "t": 86.10400000000004, "r": 270.65, "b": 91.75, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 23, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 247.516, "r_y0": 91.75, "r_x1": 270.65, "r_y1": 91.75, "r_x2": 270.65, "r_y2": 86.10400000000004, "r_x3": 247.516, "r_y3": 86.10400000000004, "coord_origin": "TOPLEFT"}, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 35, "label": "text", "bbox": {"l": 331.037, "t": 78.63300000000004, "r": 352.126, "b": 84.279, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 24, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 331.037, "r_y0": 84.279, "r_x1": 352.126, "r_y1": 84.279, "r_x2": 352.126, "r_y2": 78.63300000000004, "r_x3": 331.037, "r_y3": 78.63300000000004, "coord_origin": "TOPLEFT"}, "text": "BBoxes", "orig": "BBoxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 36, "label": "text", "bbox": {"l": 390.564, "t": 96.106, "r": 431.726, "b": 101.75199999999995, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 25, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 390.564, "r_y0": 101.75199999999995, "r_x1": 431.726, "r_y1": 101.75199999999995, "r_x2": 431.726, "r_y2": 96.106, "r_x3": 390.564, "r_y3": 96.106, "coord_origin": "TOPLEFT"}, "text": "BBoxes can be", "orig": "BBoxes can be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 37, "label": "text", "bbox": {"l": 386.824, "t": 102.226, "r": 435.47, "b": 107.87199999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 26, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 386.824, "r_y0": 107.87199999999996, "r_x1": 435.47, "r_y1": 107.87199999999996, "r_x2": 435.47, "r_y2": 102.226, "r_x3": 386.824, "r_y3": 102.226, "coord_origin": "TOPLEFT"}, "text": "traced back to the", "orig": "traced back to the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 38, "label": "text", "bbox": {"l": 388.696, "t": 108.346, "r": 433.603, "b": 113.99199999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 27, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 388.696, "r_y0": 113.99199999999996, "r_x1": 433.603, "r_y1": 113.99199999999996, "r_x2": 433.603, "r_y2": 108.346, "r_x3": 388.696, "r_y3": 108.346, "coord_origin": "TOPLEFT"}, "text": "original image to", "orig": "original image to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 39, "label": "text", "bbox": {"l": 391.078, "t": 114.46600000000001, "r": 431.225, "b": 120.11199999999997, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 28, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 391.078, "r_y0": 120.11199999999997, "r_x1": 431.225, "r_y1": 120.11199999999997, "r_x2": 431.225, "r_y2": 114.46600000000001, "r_x3": 391.078, "r_y3": 114.46600000000001, "coord_origin": "TOPLEFT"}, "text": "extract content", "orig": "extract content", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 40, "label": "text", "bbox": {"l": 431.227, "t": 151.75900000000001, "r": 498.821, "b": 157.40499999999997, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 29, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 431.227, "r_y0": 157.40499999999997, "r_x1": 498.821, "r_y1": 157.40499999999997, "r_x2": 498.821, "r_y2": 151.75900000000001, "r_x3": 431.227, "r_y3": 151.75900000000001, "coord_origin": "TOPLEFT"}, "text": "Structure Tags sequence", "orig": "Structure Tags sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 41, "label": "text", "bbox": {"l": 431.174, "t": 157.87900000000002, "r": 498.878, "b": 163.52499999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 30, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 431.174, "r_y0": 163.52499999999998, "r_x1": 498.878, "r_y1": 163.52499999999998, "r_x2": 498.878, "r_y2": 157.87900000000002, "r_x3": 431.174, "r_y3": 157.87900000000002, "coord_origin": "TOPLEFT"}, "text": "provide full description of", "orig": "provide full description of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 42, "label": "text", "bbox": {"l": 440.529, "t": 163.99900000000002, "r": 489.518, "b": 169.64499999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 440.529, "r_y0": 169.64499999999998, "r_x1": 489.518, "r_y1": 169.64499999999998, "r_x2": 489.518, "r_y2": 163.99900000000002, "r_x3": 440.529, "r_y3": 163.99900000000002, "coord_origin": "TOPLEFT"}, "text": "the table structure", "orig": "the table structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 43, "label": "text", "bbox": {"l": 328.375, "t": 178.327, "r": 367.723, "b": 183.97299999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.375, "r_y0": 183.97299999999996, "r_x1": 367.723, "r_y1": 183.97299999999996, "r_x2": 367.723, "r_y2": 178.327, "r_x3": 328.375, "r_y3": 178.327, "coord_origin": "TOPLEFT"}, "text": "Structure Tags", "orig": "Structure Tags", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 44, "label": "text", "bbox": {"l": 331.845, "t": 123.98199999999997, "r": 373.68, "b": 129.62800000000004, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 331.845, "r_y0": 129.62800000000004, "r_x1": 373.68, "r_y1": 129.62800000000004, "r_x2": 373.68, "r_y2": 123.98199999999997, "r_x3": 331.845, "r_y3": 123.98199999999997, "coord_origin": "TOPLEFT"}, "text": "BBoxes in sync", "orig": "BBoxes in sync", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 45, "label": "text", "bbox": {"l": 331.845, "t": 129.082, "r": 381.178, "b": 134.72799999999995, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 331.845, "r_y0": 134.72799999999995, "r_x1": 381.178, "r_y1": 134.72799999999995, "r_x2": 381.178, "r_y2": 129.082, "r_x3": 331.845, "r_y3": 129.082, "coord_origin": "TOPLEFT"}, "text": "with tag sequence", "orig": "with tag sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 46, "label": "text", "bbox": {"l": 196.626, "t": 88.19000000000005, "r": 219.423, "b": 93.83600000000001, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 196.626, "r_y0": 93.83600000000001, "r_x1": 219.423, "r_y1": 93.83600000000001, "r_x2": 219.423, "r_y2": 88.19000000000005, "r_x3": 196.626, "r_y3": 88.19000000000005, "coord_origin": "TOPLEFT"}, "text": "Encoder", "orig": "Encoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 47, "label": "text", "bbox": {"l": 246.668, "t": 129.56799999999998, "r": 271.499, "b": 135.21400000000006, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 246.668, "r_y0": 135.21400000000006, "r_x1": 271.499, "r_y1": 135.21400000000006, "r_x2": 271.499, "r_y2": 129.56799999999998, "r_x3": 246.668, "r_y3": 129.56799999999998, "coord_origin": "TOPLEFT"}, "text": "Structure", "orig": "Structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 48, "label": "text", "bbox": {"l": 247.516, "t": 134.668, "r": 270.65, "b": 140.31399999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 247.516, "r_y0": 140.31399999999996, "r_x1": 270.65, "r_y1": 140.31399999999996, "r_x2": 270.65, "r_y2": 134.668, "r_x3": 247.516, "r_y3": 134.668, "coord_origin": "TOPLEFT"}, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 49, "label": "text", "bbox": {"l": 330.631, "t": 89.09299999999996, "r": 365.553, "b": 94.73900000000003, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 330.631, "r_y0": 94.73900000000003, "r_x1": 365.553, "r_y1": 94.73900000000003, "r_x2": 365.553, "r_y2": 89.09299999999996, "r_x3": 330.631, "r_y3": 89.09299999999996, "coord_origin": "TOPLEFT"}, "text": "[x1, y2, x2, y2]", "orig": "[x1, y2, x2, y2]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 50, "label": "text", "bbox": {"l": 330.631, "t": 97.25300000000004, "r": 370.227, "b": 102.899, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 330.631, "r_y0": 102.899, "r_x1": 370.227, "r_y1": 102.899, "r_x2": 370.227, "r_y2": 97.25300000000004, "r_x3": 330.631, "r_y3": 97.25300000000004, "coord_origin": "TOPLEFT"}, "text": "[x1', y2', x2', y2']", "orig": "[x1', y2', x2', y2']", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 51, "label": "text", "bbox": {"l": 330.631, "t": 105.41300000000001, "r": 374.512, "b": 111.05899999999997, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 330.631, "r_y0": 111.05899999999997, "r_x1": 374.512, "r_y1": 111.05899999999997, "r_x2": 374.512, "r_y2": 105.41300000000001, "r_x3": 330.631, "r_y3": 105.41300000000001, "coord_origin": "TOPLEFT"}, "text": "[x1'', y2'', x2'', y2'']", "orig": "[x1'', y2'', x2'', y2'']", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 52, "label": "text", "bbox": {"l": 330.631, "t": 113.57299999999998, "r": 335.732, "b": 119.21900000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 330.631, "r_y0": 119.21900000000005, "r_x1": 335.732, "r_y1": 119.21900000000005, "r_x2": 335.732, "r_y2": 113.57299999999998, "r_x3": 330.631, "r_y3": 113.57299999999998, "coord_origin": "TOPLEFT"}, "text": "...", "orig": "...", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 53, "label": "text", "bbox": {"l": 322.306, "t": 141.85400000000004, "r": 335.06, "b": 146.558, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 322.306, "r_y0": 146.558, "r_x1": 335.06, "r_y1": 146.558, "r_x2": 335.06, "r_y2": 141.85400000000004, "r_x3": 322.306, "r_y3": 141.85400000000004, "coord_origin": "TOPLEFT"}, "text": "<TR>", "orig": "<TR>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 54, "label": "text", "bbox": {"l": 322.306, "t": 148.99400000000003, "r": 421.588, "b": 153.69799999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 322.306, "r_y0": 153.69799999999998, "r_x1": 421.588, "r_y1": 153.69799999999998, "r_x2": 421.588, "r_y2": 148.99400000000003, "r_x3": 322.306, "r_y3": 148.99400000000003, "coord_origin": "TOPLEFT"}, "text": "<TD> 1 </TD><TD colspan=\"2\"> 2 </TD>", "orig": "<TD> 1 </TD><TD colspan=\"2\"> 2 </TD>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 55, "label": "text", "bbox": {"l": 322.306, "t": 156.13400000000001, "r": 349.23, "b": 160.83799999999997, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 322.306, "r_y0": 160.83799999999997, "r_x1": 349.23, "r_y1": 160.83799999999997, "r_x2": 349.23, "r_y2": 156.13400000000001, "r_x3": 322.306, "r_y3": 156.13400000000001, "coord_origin": "TOPLEFT"}, "text": "</TR><TR>", "orig": "</TR><TR>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 56, "label": "text", "bbox": {"l": 322.306, "t": 163.274, "r": 374.737, "b": 167.97799999999995, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 322.306, "r_y0": 167.97799999999995, "r_x1": 374.737, "r_y1": 167.97799999999995, "r_x2": 374.737, "r_y2": 163.274, "r_x3": 322.306, "r_y3": 163.274, "coord_origin": "TOPLEFT"}, "text": "<TD> 3 </TD><TD>...", "orig": "<TD> 3 </TD><TD>...", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 57, "label": "text", "bbox": {"l": 322.306, "t": 170.414, "r": 326.557, "b": 175.11800000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 322.306, "r_y0": 175.11800000000005, "r_x1": 326.557, "r_y1": 175.11800000000005, "r_x2": 326.557, "r_y2": 170.414, "r_x3": 322.306, "r_y3": 170.414, "coord_origin": "TOPLEFT"}, "text": "...", "orig": "...", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 58, "label": "text", "bbox": {"l": 323.511, "t": 89.74300000000005, "r": 326.914, "b": 95.38900000000001, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 323.511, "r_y0": 95.38900000000001, "r_x1": 326.914, "r_y1": 95.38900000000001, "r_x2": 326.914, "r_y2": 89.74300000000005, "r_x3": 323.511, "r_y3": 89.74300000000005, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 59, "label": "text", "bbox": {"l": 323.715, "t": 97.86199999999997, "r": 327.118, "b": 103.50800000000004, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 48, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 323.715, "r_y0": 103.50800000000004, "r_x1": 327.118, "r_y1": 103.50800000000004, "r_x2": 327.118, "r_y2": 97.86199999999997, "r_x3": 323.715, "r_y3": 97.86199999999997, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 60, "label": "text", "bbox": {"l": 323.715, "t": 106.06299999999999, "r": 327.118, "b": 111.70899999999995, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 49, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 323.715, "r_y0": 111.70899999999995, "r_x1": 327.118, "r_y1": 111.70899999999995, "r_x2": 327.118, "r_y2": 106.06299999999999, "r_x3": 323.715, "r_y3": 106.06299999999999, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 61, "label": "text", "bbox": {"l": 454.464, "t": 104.61900000000003, "r": 457.867, "b": 110.26499999999999, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 50, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 454.464, "r_y0": 110.26499999999999, "r_x1": 457.867, "r_y1": 110.26499999999999, "r_x2": 457.867, "r_y2": 104.61900000000003, "r_x3": 454.464, "r_y3": 104.61900000000003, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 62, "label": "text", "bbox": {"l": 493.326, "t": 91.16899999999998, "r": 496.729, "b": 96.81500000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 51, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 493.326, "r_y0": 96.81500000000005, "r_x1": 496.729, "r_y1": 96.81500000000005, "r_x2": 496.729, "r_y2": 91.16899999999998, "r_x3": 493.326, "r_y3": 91.16899999999998, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 63, "label": "text", "bbox": {"l": 454.083, "t": 90.64200000000005, "r": 457.486, "b": 96.28800000000001, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 52, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 454.083, "r_y0": 96.28800000000001, "r_x1": 457.486, "r_y1": 96.28800000000001, "r_x2": 457.486, "r_y2": 90.64200000000005, "r_x3": 454.083, "r_y3": 90.64200000000005, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}]}, {"id": 6, "label": "caption", "bbox": {"l": 50.112, "t": 203.986, "r": 545.108, "b": 224.88099999999997, "coord_origin": "TOPLEFT"}, "confidence": 0.9677652716636658, "cells": [{"index": 53, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 212.92600000000004, "r_x1": 86.884, "r_y1": 212.92600000000004, "r_x2": 86.884, "r_y2": 204.37400000000002, "r_x3": 50.112, "r_y3": 204.37400000000002, "coord_origin": "TOPLEFT"}, "text": "Figure 3:", "orig": "Figure 3:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 54, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 94.021, "r_y0": 212.942, "r_x1": 149.851, "r_y1": 212.942, "r_x2": 149.851, "r_y2": 203.986, "r_x3": 94.021, "r_y3": 203.986, "coord_origin": "TOPLEFT"}, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 55, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 152.861, "r_y0": 212.92600000000004, "r_x1": 545.108, "r_y1": 212.92600000000004, "r_x2": 545.108, "r_y2": 204.37400000000002, "r_x3": 152.861, "r_y3": 204.37400000000002, "coord_origin": "TOPLEFT"}, "text": "takes in an image of the PDF and creates bounding box and HTML structure predictions that are", "orig": "takes in an image of the PDF and creates bounding box and HTML structure predictions that are", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 56, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 224.88099999999997, "r_x1": 436.013, "r_y1": 224.88099999999997, "r_x2": 436.013, "r_y2": 216.32899999999995, "r_x3": 50.112, "r_y3": 216.32899999999995, "coord_origin": "TOPLEFT"}, "text": "synchronized. The bounding boxes grabs the content from the PDF and inserts it in the structure.", "orig": "synchronized. The bounding boxes grabs the content from the PDF and inserts it in the structure.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 5, "label": "picture", "bbox": {"l": 53.03328323364258, "t": 257.66534423828125, "r": 285.3731689453125, "b": 507.6688537597656, "coord_origin": "TOPLEFT"}, "confidence": 0.9724942445755005, "cells": [{"index": 57, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 74.253, "r_y0": 263.884, "r_x1": 101.758, "r_y1": 263.884, "r_x2": 101.758, "r_y2": 259.52, "r_x3": 74.253, "r_y3": 259.52, "coord_origin": "TOPLEFT"}, "text": "Input Image", "orig": "Input Image", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 58, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 122.3, "r_y0": 264.015, "r_x1": 157.84, "r_y1": 264.015, "r_x2": 157.84, "r_y2": 259.65, "r_x3": 122.3, "r_y3": 259.65, "coord_origin": "TOPLEFT"}, "text": "Tokenised Tags", "orig": "Tokenised Tags", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 59, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 78.549, "r_y0": 376.78, "r_x1": 125.684, "r_y1": 376.78, "r_x2": 125.684, "r_y2": 372.588, "r_x3": 78.549, "r_y3": 372.588, "coord_origin": "TOPLEFT"}, "text": "Multi-Head Attention", "orig": "Multi-Head Attention", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 60, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 78.513, "r_y0": 396.713, "r_x1": 125.111, "r_y1": 396.713, "r_x2": 125.111, "r_y2": 392.52, "r_x3": 78.513, "r_y3": 392.52, "coord_origin": "TOPLEFT"}, "text": "Add & Normalisation", "orig": "Add & Normalisation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 61, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 76.025, "r_y0": 429.848, "r_x1": 127.923, "r_y1": 429.848, "r_x2": 127.923, "r_y2": 425.655, "r_x3": 76.025, "r_y3": 425.655, "coord_origin": "TOPLEFT"}, "text": "Feed Forward Network", "orig": "Feed Forward Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 62, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 78.383, "r_y0": 450.284, "r_x1": 124.98, "r_y1": 450.284, "r_x2": 124.98, "r_y2": 446.091, "r_x3": 78.383, "r_y3": 446.091, "coord_origin": "TOPLEFT"}, "text": "Add & Normalisation", "orig": "Add & Normalisation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 63, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 167.469, "r_y0": 467.838, "r_x1": 181.629, "r_y1": 467.838, "r_x2": 181.629, "r_y2": 463.645, "r_x3": 167.469, "r_y3": 463.645, "coord_origin": "TOPLEFT"}, "text": "Linear", "orig": "Linear", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 64, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 165.613, "r_y0": 483.866, "r_x1": 184.432, "r_y1": 483.866, "r_x2": 184.432, "r_y2": 479.673, "r_x3": 165.613, "r_y3": 479.673, "coord_origin": "TOPLEFT"}, "text": "Softmax", "orig": "Softmax", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 65, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 65.32, "r_y0": 329.941, "r_x1": 132.925, "r_y1": 329.941, "r_x2": 132.925, "r_y2": 325.527, "r_x3": 65.32, "r_y3": 325.527, "coord_origin": "TOPLEFT"}, "text": "CNN BACKBONE ENCODER", "orig": "CNN BACKBONE ENCODER", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 66, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 119.515, "r_y0": 274.491, "r_x1": 126.837, "r_y1": 274.491, "r_x2": 126.837, "r_y2": 270.73900000000003, "r_x3": 119.515, "r_y3": 270.73900000000003, "coord_origin": "TOPLEFT"}, "text": "[30,", "orig": "[30,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 67, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 129.2, "r_y0": 274.491, "r_x1": 132.745, "r_y1": 274.491, "r_x2": 132.745, "r_y2": 270.73900000000003, "r_x3": 129.2, "r_y3": 270.73900000000003, "coord_origin": "TOPLEFT"}, "text": "1,", "orig": "1,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 68, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 135.108, "r_y0": 274.491, "r_x1": 138.652, "r_y1": 274.491, "r_x2": 138.652, "r_y2": 270.73900000000003, "r_x3": 135.108, "r_y3": 270.73900000000003, "coord_origin": "TOPLEFT"}, "text": "2,", "orig": "2,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 69, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 141.015, "r_y0": 274.491, "r_x1": 144.56, "r_y1": 274.491, "r_x2": 144.56, "r_y2": 270.73900000000003, "r_x3": 141.015, "r_y3": 270.73900000000003, "coord_origin": "TOPLEFT"}, "text": "3,", "orig": "3,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 70, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 146.923, "r_y0": 274.491, "r_x1": 160.625, "r_y1": 274.491, "r_x2": 160.625, "r_y2": 270.73900000000003, "r_x3": 146.923, "r_y3": 270.73900000000003, "coord_origin": "TOPLEFT"}, "text": "4, \u20263,", "orig": "4, \u20263,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 71, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 128.729, "r_y0": 279.741, "r_x1": 132.273, "r_y1": 279.741, "r_x2": 132.273, "r_y2": 275.98900000000003, "r_x3": 128.729, "r_y3": 275.98900000000003, "coord_origin": "TOPLEFT"}, "text": "4,", "orig": "4,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 72, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.636, "r_y0": 279.741, "r_x1": 138.181, "r_y1": 279.741, "r_x2": 138.181, "r_y2": 275.98900000000003, "r_x3": 134.636, "r_y3": 275.98900000000003, "coord_origin": "TOPLEFT"}, "text": "5,", "orig": "5,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 73, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 140.544, "r_y0": 279.741, "r_x1": 151.411, "r_y1": 279.741, "r_x2": 151.411, "r_y2": 275.98900000000003, "r_x3": 140.544, "r_y3": 275.98900000000003, "coord_origin": "TOPLEFT"}, "text": "8, 31]", "orig": "8, 31]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 74, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 60.434, "r_y0": 343.926, "r_x1": 79.019, "r_y1": 343.926, "r_x2": 79.019, "r_y2": 340.521, "r_x3": 60.434, "r_y3": 340.521, "coord_origin": "TOPLEFT"}, "text": "Positional", "orig": "Positional", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 75, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 60.598, "r_y0": 348.352, "r_x1": 78.855, "r_y1": 348.352, "r_x2": 78.855, "r_y2": 344.948, "r_x3": 60.598, "r_y3": 344.948, "coord_origin": "TOPLEFT"}, "text": "Encoding", "orig": "Encoding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 76, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.829, "r_y0": 298.344, "r_x1": 153.414, "r_y1": 298.344, "r_x2": 153.414, "r_y2": 294.939, "r_x3": 134.829, "r_y3": 294.939, "coord_origin": "TOPLEFT"}, "text": "Positional", "orig": "Positional", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 77, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.993, "r_y0": 302.77, "r_x1": 153.25, "r_y1": 302.77, "r_x2": 153.25, "r_y2": 299.365, "r_x3": 134.993, "r_y3": 299.365, "coord_origin": "TOPLEFT"}, "text": "Encoding", "orig": "Encoding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 78, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 150.552, "r_y0": 350.753, "r_x1": 197.149, "r_y1": 350.753, "r_x2": 197.149, "r_y2": 346.56, "r_x3": 150.552, "r_y3": 346.56, "coord_origin": "TOPLEFT"}, "text": "Add & Normalisation", "orig": "Add & Normalisation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 79, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 150.552, "r_y0": 399.818, "r_x1": 197.149, "r_y1": 399.818, "r_x2": 197.149, "r_y2": 395.625, "r_x3": 150.552, "r_y3": 395.625, "coord_origin": "TOPLEFT"}, "text": "Add & Normalisation", "orig": "Add & Normalisation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 80, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 150.185, "r_y0": 381.063, "r_x1": 197.32, "r_y1": 381.063, "r_x2": 197.32, "r_y2": 376.87, "r_x3": 150.185, "r_y3": 376.87, "coord_origin": "TOPLEFT"}, "text": "Multi-Head Attention", "orig": "Multi-Head Attention", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 81, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 150.552, "r_y0": 445.643, "r_x1": 197.149, "r_y1": 445.643, "r_x2": 197.149, "r_y2": 441.45, "r_x3": 150.552, "r_y3": 441.45, "coord_origin": "TOPLEFT"}, "text": "Add & Normalisation", "orig": "Add & Normalisation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 82, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 147.864, "r_y0": 427.488, "r_x1": 199.762, "r_y1": 427.488, "r_x2": 199.762, "r_y2": 423.295, "r_x3": 147.864, "r_y3": 423.295, "coord_origin": "TOPLEFT"}, "text": "Feed Forward Network", "orig": "Feed Forward Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 83, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 241.566, "r_y0": 319.657, "r_x1": 255.725, "r_y1": 319.657, "r_x2": 255.725, "r_y2": 315.465, "r_x3": 241.566, "r_y3": 315.465, "coord_origin": "TOPLEFT"}, "text": "Linear", "orig": "Linear", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 84, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 241.917, "r_y0": 366.759, "r_x1": 256.077, "r_y1": 366.759, "r_x2": 256.077, "r_y2": 362.567, "r_x3": 241.917, "r_y3": 362.567, "coord_origin": "TOPLEFT"}, "text": "Linear", "orig": "Linear", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 85, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 228.054, "r_y0": 342.014, "r_x1": 269.393, "r_y1": 342.014, "r_x2": 269.393, "r_y2": 337.821, "r_x3": 228.054, "r_y3": 337.821, "coord_origin": "TOPLEFT"}, "text": "Attention Network", "orig": "Attention Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 86, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 228.446, "r_y0": 410.541, "r_x1": 238.739, "r_y1": 410.541, "r_x2": 238.739, "r_y2": 406.349, "r_x3": 228.446, "r_y3": 406.349, "coord_origin": "TOPLEFT"}, "text": "MLP", "orig": "MLP", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 87, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 256.298, "r_y0": 410.598, "r_x1": 270.457, "r_y1": 410.598, "r_x2": 270.457, "r_y2": 406.405, "r_x3": 256.298, "r_y3": 406.405, "coord_origin": "TOPLEFT"}, "text": "Linear", "orig": "Linear", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 88, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 239.545, "r_y0": 387.608, "r_x1": 258.089, "r_y1": 387.608, "r_x2": 258.089, "r_y2": 383.415, "r_x3": 239.545, "r_y3": 383.415, "coord_origin": "TOPLEFT"}, "text": "Sigmoid", "orig": "Sigmoid", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 89, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 59.258, "r_y0": 449.783, "r_x1": 59.245, "r_y1": 384.871, "r_x2": 55.273, "r_y2": 384.872, "r_x3": 55.286, "r_y3": 449.784, "coord_origin": "TOPLEFT"}, "text": "Transformer Encoder Network", "orig": "Transformer Encoder Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 90, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 59.058, "r_y0": 378.454, "r_x1": 59.055, "r_y1": 373.809, "r_x2": 55.345, "r_y2": 373.812, "r_x3": 55.348, "r_y3": 378.457, "coord_origin": "TOPLEFT"}, "text": "x2", "orig": "x2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 91, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 85.296, "r_y0": 490.108, "r_x1": 122.166, "r_y1": 490.098, "r_x2": 122.165, "r_y2": 485.687, "r_x3": 85.295, "r_y3": 485.697, "coord_origin": "TOPLEFT"}, "text": "Encoded Output", "orig": "Encoded Output", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 92, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 229.666, "r_y0": 285.074, "r_x1": 265.321, "r_y1": 285.064, "r_x2": 265.32, "r_y2": 281.281, "r_x3": 229.665, "r_y3": 281.291, "coord_origin": "TOPLEFT"}, "text": "Encoded Output", "orig": "Encoded Output", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 93, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 157.174, "r_y0": 505.871, "r_x1": 190.419, "r_y1": 505.862, "r_x2": 190.417, "r_y2": 501.45, "r_x3": 157.172, "r_y3": 501.459, "coord_origin": "TOPLEFT"}, "text": "Predicted Tags", "orig": "Predicted Tags", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 94, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 227.816, "r_y0": 443.634, "r_x1": 269.396, "r_y1": 443.622, "r_x2": 269.395, "r_y2": 439.211, "r_x3": 227.815, "r_y3": 439.222, "coord_origin": "TOPLEFT"}, "text": "Bounding Boxes &", "orig": "Bounding Boxes &", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 95, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 233.703, "r_y0": 449.632, "r_x1": 263.513, "r_y1": 449.624, "r_x2": 263.511, "r_y2": 445.212, "r_x3": 233.701, "r_y3": 445.22, "coord_origin": "TOPLEFT"}, "text": "Classification", "orig": "Classification", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 96, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 184.747, "r_y0": 298.506, "r_x1": 210.91, "r_y1": 298.506, "r_x2": 210.91, "r_y2": 294.534, "r_x3": 184.747, "r_y3": 294.534, "coord_origin": "TOPLEFT"}, "text": "Transformer", "orig": "Transformer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 97, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 178.912, "r_y0": 304.256, "r_x1": 216.744, "r_y1": 304.256, "r_x2": 216.744, "r_y2": 300.284, "r_x3": 178.912, "r_y3": 300.284, "coord_origin": "TOPLEFT"}, "text": "Decoder Network", "orig": "Decoder Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 98, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 194.246, "r_y0": 287.601, "r_x1": 198.891, "r_y1": 287.601, "r_x2": 198.891, "r_y2": 283.891, "r_x3": 194.246, "r_y3": 283.891, "coord_origin": "TOPLEFT"}, "text": "x4", "orig": "x4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 99, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 221.456, "r_y0": 277.548, "r_x1": 276.471, "r_y1": 277.548, "r_x2": 276.471, "r_y2": 273.134, "r_x3": 221.456, "r_y3": 273.134, "coord_origin": "TOPLEFT"}, "text": "CELL BBOX DECODER", "orig": "CELL BBOX DECODER", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 100, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.652, "r_y0": 328.837, "r_x1": 195.97, "r_y1": 328.837, "r_x2": 195.97, "r_y2": 324.644, "r_x3": 151.652, "r_y3": 324.644, "coord_origin": "TOPLEFT"}, "text": "Masked Multi-Head", "orig": "Masked Multi-Head", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 101, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 163.433, "r_y0": 334.837, "r_x1": 184.19, "r_y1": 334.837, "r_x2": 184.19, "r_y2": 330.644, "r_x3": 163.433, "r_y3": 330.644, "coord_origin": "TOPLEFT"}, "text": "Attention", "orig": "Attention", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": [{"id": 64, "label": "text", "bbox": {"l": 74.253, "t": 259.52, "r": 101.758, "b": 263.884, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 57, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 74.253, "r_y0": 263.884, "r_x1": 101.758, "r_y1": 263.884, "r_x2": 101.758, "r_y2": 259.52, "r_x3": 74.253, "r_y3": 259.52, "coord_origin": "TOPLEFT"}, "text": "Input Image", "orig": "Input Image", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 65, "label": "text", "bbox": {"l": 122.3, "t": 259.65, "r": 157.84, "b": 264.015, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 58, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 122.3, "r_y0": 264.015, "r_x1": 157.84, "r_y1": 264.015, "r_x2": 157.84, "r_y2": 259.65, "r_x3": 122.3, "r_y3": 259.65, "coord_origin": "TOPLEFT"}, "text": "Tokenised Tags", "orig": "Tokenised Tags", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 66, "label": "text", "bbox": {"l": 78.549, "t": 372.588, "r": 125.684, "b": 376.78, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 59, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 78.549, "r_y0": 376.78, "r_x1": 125.684, "r_y1": 376.78, "r_x2": 125.684, "r_y2": 372.588, "r_x3": 78.549, "r_y3": 372.588, "coord_origin": "TOPLEFT"}, "text": "Multi-Head Attention", "orig": "Multi-Head Attention", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 67, "label": "text", "bbox": {"l": 78.513, "t": 392.52, "r": 125.111, "b": 396.713, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 60, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 78.513, "r_y0": 396.713, "r_x1": 125.111, "r_y1": 396.713, "r_x2": 125.111, "r_y2": 392.52, "r_x3": 78.513, "r_y3": 392.52, "coord_origin": "TOPLEFT"}, "text": "Add & Normalisation", "orig": "Add & Normalisation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 68, "label": "text", "bbox": {"l": 76.025, "t": 425.655, "r": 127.923, "b": 429.848, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 61, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 76.025, "r_y0": 429.848, "r_x1": 127.923, "r_y1": 429.848, "r_x2": 127.923, "r_y2": 425.655, "r_x3": 76.025, "r_y3": 425.655, "coord_origin": "TOPLEFT"}, "text": "Feed Forward Network", "orig": "Feed Forward Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 69, "label": "text", "bbox": {"l": 78.383, "t": 446.091, "r": 124.98, "b": 450.284, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 62, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 78.383, "r_y0": 450.284, "r_x1": 124.98, "r_y1": 450.284, "r_x2": 124.98, "r_y2": 446.091, "r_x3": 78.383, "r_y3": 446.091, "coord_origin": "TOPLEFT"}, "text": "Add & Normalisation", "orig": "Add & Normalisation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 70, "label": "text", "bbox": {"l": 167.469, "t": 463.645, "r": 181.629, "b": 467.838, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 63, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 167.469, "r_y0": 467.838, "r_x1": 181.629, "r_y1": 467.838, "r_x2": 181.629, "r_y2": 463.645, "r_x3": 167.469, "r_y3": 463.645, "coord_origin": "TOPLEFT"}, "text": "Linear", "orig": "Linear", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 71, "label": "text", "bbox": {"l": 165.613, "t": 479.673, "r": 184.432, "b": 483.866, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 64, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 165.613, "r_y0": 483.866, "r_x1": 184.432, "r_y1": 483.866, "r_x2": 184.432, "r_y2": 479.673, "r_x3": 165.613, "r_y3": 479.673, "coord_origin": "TOPLEFT"}, "text": "Softmax", "orig": "Softmax", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 72, "label": "text", "bbox": {"l": 65.32, "t": 325.527, "r": 132.925, "b": 329.941, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 65, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 65.32, "r_y0": 329.941, "r_x1": 132.925, "r_y1": 329.941, "r_x2": 132.925, "r_y2": 325.527, "r_x3": 65.32, "r_y3": 325.527, "coord_origin": "TOPLEFT"}, "text": "CNN BACKBONE ENCODER", "orig": "CNN BACKBONE ENCODER", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 73, "label": "text", "bbox": {"l": 119.515, "t": 270.73900000000003, "r": 126.837, "b": 274.491, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 66, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 119.515, "r_y0": 274.491, "r_x1": 126.837, "r_y1": 274.491, "r_x2": 126.837, "r_y2": 270.73900000000003, "r_x3": 119.515, "r_y3": 270.73900000000003, "coord_origin": "TOPLEFT"}, "text": "[30,", "orig": "[30,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 74, "label": "text", "bbox": {"l": 129.2, "t": 270.73900000000003, "r": 132.745, "b": 274.491, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 67, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 129.2, "r_y0": 274.491, "r_x1": 132.745, "r_y1": 274.491, "r_x2": 132.745, "r_y2": 270.73900000000003, "r_x3": 129.2, "r_y3": 270.73900000000003, "coord_origin": "TOPLEFT"}, "text": "1,", "orig": "1,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 75, "label": "text", "bbox": {"l": 135.108, "t": 270.73900000000003, "r": 138.652, "b": 274.491, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 68, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 135.108, "r_y0": 274.491, "r_x1": 138.652, "r_y1": 274.491, "r_x2": 138.652, "r_y2": 270.73900000000003, "r_x3": 135.108, "r_y3": 270.73900000000003, "coord_origin": "TOPLEFT"}, "text": "2,", "orig": "2,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 76, "label": "text", "bbox": {"l": 141.015, "t": 270.73900000000003, "r": 144.56, "b": 274.491, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 69, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 141.015, "r_y0": 274.491, "r_x1": 144.56, "r_y1": 274.491, "r_x2": 144.56, "r_y2": 270.73900000000003, "r_x3": 141.015, "r_y3": 270.73900000000003, "coord_origin": "TOPLEFT"}, "text": "3,", "orig": "3,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 77, "label": "text", "bbox": {"l": 146.923, "t": 270.73900000000003, "r": 160.625, "b": 274.491, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 70, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 146.923, "r_y0": 274.491, "r_x1": 160.625, "r_y1": 274.491, "r_x2": 160.625, "r_y2": 270.73900000000003, "r_x3": 146.923, "r_y3": 270.73900000000003, "coord_origin": "TOPLEFT"}, "text": "4, \u20263,", "orig": "4, \u20263,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 78, "label": "text", "bbox": {"l": 128.729, "t": 275.98900000000003, "r": 132.273, "b": 279.741, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 71, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 128.729, "r_y0": 279.741, "r_x1": 132.273, "r_y1": 279.741, "r_x2": 132.273, "r_y2": 275.98900000000003, "r_x3": 128.729, "r_y3": 275.98900000000003, "coord_origin": "TOPLEFT"}, "text": "4,", "orig": "4,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 79, "label": "text", "bbox": {"l": 134.636, "t": 275.98900000000003, "r": 138.181, "b": 279.741, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 72, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.636, "r_y0": 279.741, "r_x1": 138.181, "r_y1": 279.741, "r_x2": 138.181, "r_y2": 275.98900000000003, "r_x3": 134.636, "r_y3": 275.98900000000003, "coord_origin": "TOPLEFT"}, "text": "5,", "orig": "5,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 80, "label": "text", "bbox": {"l": 140.544, "t": 275.98900000000003, "r": 151.411, "b": 279.741, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 73, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 140.544, "r_y0": 279.741, "r_x1": 151.411, "r_y1": 279.741, "r_x2": 151.411, "r_y2": 275.98900000000003, "r_x3": 140.544, "r_y3": 275.98900000000003, "coord_origin": "TOPLEFT"}, "text": "8, 31]", "orig": "8, 31]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 81, "label": "text", "bbox": {"l": 60.434, "t": 340.521, "r": 79.019, "b": 343.926, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 74, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 60.434, "r_y0": 343.926, "r_x1": 79.019, "r_y1": 343.926, "r_x2": 79.019, "r_y2": 340.521, "r_x3": 60.434, "r_y3": 340.521, "coord_origin": "TOPLEFT"}, "text": "Positional", "orig": "Positional", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 82, "label": "text", "bbox": {"l": 60.598, "t": 344.948, "r": 78.855, "b": 348.352, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 75, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 60.598, "r_y0": 348.352, "r_x1": 78.855, "r_y1": 348.352, "r_x2": 78.855, "r_y2": 344.948, "r_x3": 60.598, "r_y3": 344.948, "coord_origin": "TOPLEFT"}, "text": "Encoding", "orig": "Encoding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 83, "label": "text", "bbox": {"l": 134.829, "t": 294.939, "r": 153.414, "b": 298.344, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 76, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.829, "r_y0": 298.344, "r_x1": 153.414, "r_y1": 298.344, "r_x2": 153.414, "r_y2": 294.939, "r_x3": 134.829, "r_y3": 294.939, "coord_origin": "TOPLEFT"}, "text": "Positional", "orig": "Positional", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 84, "label": "text", "bbox": {"l": 134.993, "t": 299.365, "r": 153.25, "b": 302.77, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 77, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.993, "r_y0": 302.77, "r_x1": 153.25, "r_y1": 302.77, "r_x2": 153.25, "r_y2": 299.365, "r_x3": 134.993, "r_y3": 299.365, "coord_origin": "TOPLEFT"}, "text": "Encoding", "orig": "Encoding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 85, "label": "text", "bbox": {"l": 150.552, "t": 346.56, "r": 197.149, "b": 350.753, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 78, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 150.552, "r_y0": 350.753, "r_x1": 197.149, "r_y1": 350.753, "r_x2": 197.149, "r_y2": 346.56, "r_x3": 150.552, "r_y3": 346.56, "coord_origin": "TOPLEFT"}, "text": "Add & Normalisation", "orig": "Add & Normalisation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 86, "label": "text", "bbox": {"l": 150.552, "t": 395.625, "r": 197.149, "b": 399.818, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 79, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 150.552, "r_y0": 399.818, "r_x1": 197.149, "r_y1": 399.818, "r_x2": 197.149, "r_y2": 395.625, "r_x3": 150.552, "r_y3": 395.625, "coord_origin": "TOPLEFT"}, "text": "Add & Normalisation", "orig": "Add & Normalisation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 87, "label": "text", "bbox": {"l": 150.185, "t": 376.87, "r": 197.32, "b": 381.063, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 80, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 150.185, "r_y0": 381.063, "r_x1": 197.32, "r_y1": 381.063, "r_x2": 197.32, "r_y2": 376.87, "r_x3": 150.185, "r_y3": 376.87, "coord_origin": "TOPLEFT"}, "text": "Multi-Head Attention", "orig": "Multi-Head Attention", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 88, "label": "text", "bbox": {"l": 150.552, "t": 441.45, "r": 197.149, "b": 445.643, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 81, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 150.552, "r_y0": 445.643, "r_x1": 197.149, "r_y1": 445.643, "r_x2": 197.149, "r_y2": 441.45, "r_x3": 150.552, "r_y3": 441.45, "coord_origin": "TOPLEFT"}, "text": "Add & Normalisation", "orig": "Add & Normalisation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 89, "label": "text", "bbox": {"l": 147.864, "t": 423.295, "r": 199.762, "b": 427.488, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 82, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 147.864, "r_y0": 427.488, "r_x1": 199.762, "r_y1": 427.488, "r_x2": 199.762, "r_y2": 423.295, "r_x3": 147.864, "r_y3": 423.295, "coord_origin": "TOPLEFT"}, "text": "Feed Forward Network", "orig": "Feed Forward Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 90, "label": "text", "bbox": {"l": 241.566, "t": 315.465, "r": 255.725, "b": 319.657, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 83, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 241.566, "r_y0": 319.657, "r_x1": 255.725, "r_y1": 319.657, "r_x2": 255.725, "r_y2": 315.465, "r_x3": 241.566, "r_y3": 315.465, "coord_origin": "TOPLEFT"}, "text": "Linear", "orig": "Linear", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 91, "label": "text", "bbox": {"l": 241.917, "t": 362.567, "r": 256.077, "b": 366.759, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 84, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 241.917, "r_y0": 366.759, "r_x1": 256.077, "r_y1": 366.759, "r_x2": 256.077, "r_y2": 362.567, "r_x3": 241.917, "r_y3": 362.567, "coord_origin": "TOPLEFT"}, "text": "Linear", "orig": "Linear", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 92, "label": "text", "bbox": {"l": 228.054, "t": 337.821, "r": 269.393, "b": 342.014, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 85, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 228.054, "r_y0": 342.014, "r_x1": 269.393, "r_y1": 342.014, "r_x2": 269.393, "r_y2": 337.821, "r_x3": 228.054, "r_y3": 337.821, "coord_origin": "TOPLEFT"}, "text": "Attention Network", "orig": "Attention Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 93, "label": "text", "bbox": {"l": 228.446, "t": 406.349, "r": 238.739, "b": 410.541, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 86, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 228.446, "r_y0": 410.541, "r_x1": 238.739, "r_y1": 410.541, "r_x2": 238.739, "r_y2": 406.349, "r_x3": 228.446, "r_y3": 406.349, "coord_origin": "TOPLEFT"}, "text": "MLP", "orig": "MLP", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 94, "label": "text", "bbox": {"l": 256.298, "t": 406.405, "r": 270.457, "b": 410.598, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 87, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 256.298, "r_y0": 410.598, "r_x1": 270.457, "r_y1": 410.598, "r_x2": 270.457, "r_y2": 406.405, "r_x3": 256.298, "r_y3": 406.405, "coord_origin": "TOPLEFT"}, "text": "Linear", "orig": "Linear", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 95, "label": "text", "bbox": {"l": 239.545, "t": 383.415, "r": 258.089, "b": 387.608, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 88, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 239.545, "r_y0": 387.608, "r_x1": 258.089, "r_y1": 387.608, "r_x2": 258.089, "r_y2": 383.415, "r_x3": 239.545, "r_y3": 383.415, "coord_origin": "TOPLEFT"}, "text": "Sigmoid", "orig": "Sigmoid", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 96, "label": "text", "bbox": {"l": 55.273, "t": 384.871, "r": 59.258, "b": 449.784, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 89, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 59.258, "r_y0": 449.783, "r_x1": 59.245, "r_y1": 384.871, "r_x2": 55.273, "r_y2": 384.872, "r_x3": 55.286, "r_y3": 449.784, "coord_origin": "TOPLEFT"}, "text": "Transformer Encoder Network", "orig": "Transformer Encoder Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 97, "label": "text", "bbox": {"l": 55.345, "t": 373.809, "r": 59.058, "b": 378.457, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 90, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 59.058, "r_y0": 378.454, "r_x1": 59.055, "r_y1": 373.809, "r_x2": 55.345, "r_y2": 373.812, "r_x3": 55.348, "r_y3": 378.457, "coord_origin": "TOPLEFT"}, "text": "x2", "orig": "x2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 98, "label": "text", "bbox": {"l": 85.295, "t": 485.687, "r": 122.166, "b": 490.108, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 91, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 85.296, "r_y0": 490.108, "r_x1": 122.166, "r_y1": 490.098, "r_x2": 122.165, "r_y2": 485.687, "r_x3": 85.295, "r_y3": 485.697, "coord_origin": "TOPLEFT"}, "text": "Encoded Output", "orig": "Encoded Output", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 99, "label": "text", "bbox": {"l": 229.665, "t": 281.281, "r": 265.321, "b": 285.074, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 92, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 229.666, "r_y0": 285.074, "r_x1": 265.321, "r_y1": 285.064, "r_x2": 265.32, "r_y2": 281.281, "r_x3": 229.665, "r_y3": 281.291, "coord_origin": "TOPLEFT"}, "text": "Encoded Output", "orig": "Encoded Output", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 100, "label": "text", "bbox": {"l": 157.172, "t": 501.45, "r": 190.419, "b": 505.871, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 93, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 157.174, "r_y0": 505.871, "r_x1": 190.419, "r_y1": 505.862, "r_x2": 190.417, "r_y2": 501.45, "r_x3": 157.172, "r_y3": 501.459, "coord_origin": "TOPLEFT"}, "text": "Predicted Tags", "orig": "Predicted Tags", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 101, "label": "text", "bbox": {"l": 227.815, "t": 439.211, "r": 269.396, "b": 443.634, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 94, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 227.816, "r_y0": 443.634, "r_x1": 269.396, "r_y1": 443.622, "r_x2": 269.395, "r_y2": 439.211, "r_x3": 227.815, "r_y3": 439.222, "coord_origin": "TOPLEFT"}, "text": "Bounding Boxes &", "orig": "Bounding Boxes &", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 102, "label": "text", "bbox": {"l": 233.701, "t": 445.212, "r": 263.513, "b": 449.632, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 95, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 233.703, "r_y0": 449.632, "r_x1": 263.513, "r_y1": 449.624, "r_x2": 263.511, "r_y2": 445.212, "r_x3": 233.701, "r_y3": 445.22, "coord_origin": "TOPLEFT"}, "text": "Classification", "orig": "Classification", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 103, "label": "text", "bbox": {"l": 184.747, "t": 294.534, "r": 210.91, "b": 298.506, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 96, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 184.747, "r_y0": 298.506, "r_x1": 210.91, "r_y1": 298.506, "r_x2": 210.91, "r_y2": 294.534, "r_x3": 184.747, "r_y3": 294.534, "coord_origin": "TOPLEFT"}, "text": "Transformer", "orig": "Transformer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 104, "label": "text", "bbox": {"l": 178.912, "t": 300.284, "r": 216.744, "b": 304.256, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 97, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 178.912, "r_y0": 304.256, "r_x1": 216.744, "r_y1": 304.256, "r_x2": 216.744, "r_y2": 300.284, "r_x3": 178.912, "r_y3": 300.284, "coord_origin": "TOPLEFT"}, "text": "Decoder Network", "orig": "Decoder Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 105, "label": "text", "bbox": {"l": 194.246, "t": 283.891, "r": 198.891, "b": 287.601, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 98, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 194.246, "r_y0": 287.601, "r_x1": 198.891, "r_y1": 287.601, "r_x2": 198.891, "r_y2": 283.891, "r_x3": 194.246, "r_y3": 283.891, "coord_origin": "TOPLEFT"}, "text": "x4", "orig": "x4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 106, "label": "text", "bbox": {"l": 221.456, "t": 273.134, "r": 276.471, "b": 277.548, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 99, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 221.456, "r_y0": 277.548, "r_x1": 276.471, "r_y1": 277.548, "r_x2": 276.471, "r_y2": 273.134, "r_x3": 221.456, "r_y3": 273.134, "coord_origin": "TOPLEFT"}, "text": "CELL BBOX DECODER", "orig": "CELL BBOX DECODER", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 107, "label": "text", "bbox": {"l": 151.652, "t": 324.644, "r": 195.97, "b": 328.837, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 100, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.652, "r_y0": 328.837, "r_x1": 195.97, "r_y1": 328.837, "r_x2": 195.97, "r_y2": 324.644, "r_x3": 151.652, "r_y3": 324.644, "coord_origin": "TOPLEFT"}, "text": "Masked Multi-Head", "orig": "Masked Multi-Head", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 108, "label": "text", "bbox": {"l": 163.433, "t": 330.644, "r": 184.19, "b": 334.837, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 101, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 163.433, "r_y0": 334.837, "r_x1": 184.19, "r_y1": 334.837, "r_x2": 184.19, "r_y2": 330.644, "r_x3": 163.433, "r_y3": 330.644, "coord_origin": "TOPLEFT"}, "text": "Attention", "orig": "Attention", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}]}, {"id": 8, "label": "caption", "bbox": {"l": 50.112, "t": 527.783, "r": 286.366, "b": 680.185, "coord_origin": "TOPLEFT"}, "confidence": 0.8913407325744629, "cells": [{"index": 102, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 536.723, "r_x1": 85.878, "r_y1": 536.723, "r_x2": 85.878, "r_y2": 528.171, "r_x3": 50.112, "r_y3": 528.171, "coord_origin": "TOPLEFT"}, "text": "Figure 4:", "orig": "Figure 4:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 103, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 90.73, "r_y0": 536.723, "r_x1": 229.787, "r_y1": 536.723, "r_x2": 229.787, "r_y2": 528.171, "r_x3": 90.73, "r_y3": 528.171, "coord_origin": "TOPLEFT"}, "text": "Given an input image of a table, the", "orig": "Given an input image of a table, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 104, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 231.787, "r_y0": 536.739, "r_x1": 267.762, "r_y1": 536.739, "r_x2": 267.762, "r_y2": 527.783, "r_x3": 231.787, "r_y3": 527.783, "coord_origin": "TOPLEFT"}, "text": "Encoder", "orig": "Encoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 105, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 269.764, "r_y0": 536.723, "r_x1": 286.362, "r_y1": 536.723, "r_x2": 286.362, "r_y2": 528.171, "r_x3": 269.764, "r_y3": 528.171, "coord_origin": "TOPLEFT"}, "text": "pro-", "orig": "pro-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 106, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 548.678, "r_x1": 286.365, "r_y1": 548.678, "r_x2": 286.365, "r_y2": 540.126, "r_x3": 50.112, "r_y3": 540.126, "coord_origin": "TOPLEFT"}, "text": "duces fixed-length features that represent the input image.", "orig": "duces fixed-length features that represent the input image.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 107, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 560.634, "r_x1": 205.847, "r_y1": 560.634, "r_x2": 205.847, "r_y2": 552.082, "r_x3": 50.112, "r_y3": 552.082, "coord_origin": "TOPLEFT"}, "text": "The features are then passed to both the", "orig": "The features are then passed to both the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 108, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 208.018, "r_y0": 560.65, "r_x1": 286.364, "r_y1": 560.65, "r_x2": 286.364, "r_y2": 551.694, "r_x3": 208.018, "r_y3": 551.694, "coord_origin": "TOPLEFT"}, "text": "Structure Decoder", "orig": "Structure Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 109, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 572.5889999999999, "r_x1": 64.498, "r_y1": 572.5889999999999, "r_x2": 64.498, "r_y2": 564.037, "r_x3": 50.112, "r_y3": 564.037, "coord_origin": "TOPLEFT"}, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 110, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 68.165, "r_y0": 572.605, "r_x1": 151.313, "r_y1": 572.605, "r_x2": 151.313, "r_y2": 563.649, "r_x3": 68.165, "r_y3": 563.649, "coord_origin": "TOPLEFT"}, "text": "Cell BBox Decoder", "orig": "Cell BBox Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 111, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.313, "r_y0": 572.5889999999999, "r_x1": 153.804, "r_y1": 572.5889999999999, "r_x2": 153.804, "r_y2": 564.037, "r_x3": 151.313, "r_y3": 564.037, "coord_origin": "TOPLEFT"}, "text": ".", "orig": ".", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 112, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.419, "r_y0": 572.5889999999999, "r_x1": 241.933, "r_y1": 572.5889999999999, "r_x2": 241.933, "r_y2": 564.037, "r_x3": 160.419, "r_y3": 564.037, "coord_origin": "TOPLEFT"}, "text": "During training, the", "orig": "During training, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 113, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 245.595, "r_y0": 572.605, "r_x1": 286.362, "r_y1": 572.605, "r_x2": 286.362, "r_y2": 563.649, "r_x3": 245.595, "r_y3": 563.649, "coord_origin": "TOPLEFT"}, "text": "Structure", "orig": "Structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 114, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 584.56, "r_x1": 85.519, "r_y1": 584.56, "r_x2": 85.519, "r_y2": 575.604, "r_x3": 50.112, "r_y3": 575.604, "coord_origin": "TOPLEFT"}, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 115, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 88.623, "r_y0": 584.544, "r_x1": 286.361, "r_y1": 584.544, "r_x2": 286.361, "r_y2": 575.992, "r_x3": 88.623, "r_y3": 575.992, "coord_origin": "TOPLEFT"}, "text": "receives 'tokenized tags' of the HTML code that", "orig": "receives 'tokenized tags' of the HTML code that", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 116, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 596.499, "r_x1": 286.365, "r_y1": 596.499, "r_x2": 286.365, "r_y2": 587.947, "r_x3": 50.112, "r_y3": 587.947, "coord_origin": "TOPLEFT"}, "text": "represent the table structure. Afterwards, a transformer en-", "orig": "represent the table structure. Afterwards, a transformer en-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 117, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 608.454, "r_x1": 286.365, "r_y1": 608.454, "r_x2": 286.365, "r_y2": 599.902, "r_x3": 50.112, "r_y3": 599.902, "coord_origin": "TOPLEFT"}, "text": "coder and decoder architecture is employed to produce fea-", "orig": "coder and decoder architecture is employed to produce fea-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 118, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 620.409, "r_x1": 240.438, "r_y1": 620.409, "r_x2": 240.438, "r_y2": 611.857, "r_x3": 50.112, "r_y3": 611.857, "coord_origin": "TOPLEFT"}, "text": "tures that are received by a linear layer, and the", "orig": "tures that are received by a linear layer, and the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 119, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 243.198, "r_y0": 620.425, "r_x1": 286.366, "r_y1": 620.425, "r_x2": 286.366, "r_y2": 611.469, "r_x3": 243.198, "r_y3": 611.469, "coord_origin": "TOPLEFT"}, "text": "Cell BBox", "orig": "Cell BBox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 120, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 632.381, "r_x1": 87.013, "r_y1": 632.381, "r_x2": 87.013, "r_y2": 623.425, "r_x3": 50.112, "r_y3": 623.425, "coord_origin": "TOPLEFT"}, "text": "Decoder.", "orig": "Decoder.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 121, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 93.14, "r_y0": 632.381, "r_x1": 286.365, "r_y1": 632.381, "r_x2": 286.365, "r_y2": 623.425, "r_x3": 93.14, "r_y3": 623.425, "coord_origin": "TOPLEFT"}, "text": "The linear layer is applied to the features to", "orig": "The linear layer is applied to the features to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 122, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 644.336, "r_x1": 286.365, "r_y1": 644.336, "r_x2": 286.365, "r_y2": 635.38, "r_x3": 50.112, "r_y3": 635.38, "coord_origin": "TOPLEFT"}, "text": "predict the tags. Simultaneously, the Cell BBox Decoder", "orig": "predict the tags. Simultaneously, the Cell BBox Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 123, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 656.275, "r_x1": 220.582, "r_y1": 656.275, "r_x2": 220.582, "r_y2": 647.723, "r_x3": 50.112, "r_y3": 647.723, "coord_origin": "TOPLEFT"}, "text": "selects features referring to the data cells ('", "orig": "selects features referring to the data cells ('", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 124, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 220.578, "r_y0": 656.111, "r_x1": 228.327, "r_y1": 656.111, "r_x2": 228.327, "r_y2": 647.405, "r_x3": 220.578, "r_y3": 647.405, "coord_origin": "TOPLEFT"}, "text": "<", "orig": "<", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 125, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 228.327, "r_y0": 656.275, "r_x1": 236.078, "r_y1": 656.275, "r_x2": 236.078, "r_y2": 647.723, "r_x3": 228.327, "r_y3": 647.723, "coord_origin": "TOPLEFT"}, "text": "td", "orig": "td", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 126, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 236.078, "r_y0": 656.111, "r_x1": 243.827, "r_y1": 656.111, "r_x2": 243.827, "r_y2": 647.405, "r_x3": 236.078, "r_y3": 647.405, "coord_origin": "TOPLEFT"}, "text": ">", "orig": ">", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 127, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 243.826, "r_y0": 656.275, "r_x1": 255.293, "r_y1": 656.275, "r_x2": 255.293, "r_y2": 647.723, "r_x3": 243.826, "r_y3": 647.723, "coord_origin": "TOPLEFT"}, "text": "', '", "orig": "', '", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 128, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 255.291, "r_y0": 656.111, "r_x1": 263.04, "r_y1": 656.111, "r_x2": 263.04, "r_y2": 647.405, "r_x3": 255.291, "r_y3": 647.405, "coord_origin": "TOPLEFT"}, "text": "<", "orig": "<", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 129, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 263.04, "r_y0": 656.275, "r_x1": 286.362, "r_y1": 656.275, "r_x2": 286.362, "r_y2": 647.723, "r_x3": 263.04, "r_y3": 647.723, "coord_origin": "TOPLEFT"}, "text": "') and", "orig": "') and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 130, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 668.23, "r_x1": 286.365, "r_y1": 668.23, "r_x2": 286.365, "r_y2": 659.678, "r_x3": 50.112, "r_y3": 659.678, "coord_origin": "TOPLEFT"}, "text": "passes them through an attention network, an MLP, and a", "orig": "passes them through an attention network, an MLP, and a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 131, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 680.185, "r_x1": 218.47, "r_y1": 680.185, "r_x2": 218.47, "r_y2": 671.633, "r_x3": 50.112, "r_y3": 671.633, "coord_origin": "TOPLEFT"}, "text": "linear layer to predict the bounding boxes.", "orig": "linear layer to predict the bounding boxes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 4, "label": "text", "bbox": {"l": 308.862, "t": 249.803, "r": 545.115, "b": 294.221, "coord_origin": "TOPLEFT"}, "confidence": 0.9831458330154419, "cells": [{"index": 132, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 258.355, "r_x1": 545.115, "r_y1": 258.355, "r_x2": 545.115, "r_y2": 249.803, "r_x3": 308.862, "r_y3": 249.803, "coord_origin": "TOPLEFT"}, "text": "forming classification, and adding an adaptive pooling layer", "orig": "forming classification, and adding an adaptive pooling layer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 133, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 270.31100000000004, "r_x1": 366.466, "r_y1": 270.31100000000004, "r_x2": 366.466, "r_y2": 261.759, "r_x3": 308.862, "r_y3": 261.759, "coord_origin": "TOPLEFT"}, "text": "of size 28*28.", "orig": "of size 28*28.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 134, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 371.706, "r_y0": 270.31100000000004, "r_x1": 545.115, "r_y1": 270.31100000000004, "r_x2": 545.115, "r_y2": 261.759, "r_x3": 371.706, "r_y3": 261.759, "coord_origin": "TOPLEFT"}, "text": "ResNet by default downsamples the image", "orig": "ResNet by default downsamples the image", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 135, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 282.266, "r_x1": 545.115, "r_y1": 282.266, "r_x2": 545.115, "r_y2": 273.71400000000006, "r_x3": 308.862, "r_y3": 273.71400000000006, "coord_origin": "TOPLEFT"}, "text": "resolution by 32 and then the encoded image is provided to", "orig": "resolution by 32 and then the encoded image is provided to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 136, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 294.221, "r_x1": 341.24, "r_y1": 294.221, "r_x2": 341.24, "r_y2": 285.669, "r_x3": 308.862, "r_y3": 285.669, "coord_origin": "TOPLEFT"}, "text": "both the", "orig": "both the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 137, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 343.731, "r_y0": 294.078, "r_x1": 417.235, "r_y1": 294.078, "r_x2": 417.235, "r_y2": 285.49, "r_x3": 343.731, "r_y3": 285.49, "coord_origin": "TOPLEFT"}, "text": "Structure Decoder", "orig": "Structure Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 138, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 417.234, "r_y0": 294.221, "r_x1": 436.601, "r_y1": 294.221, "r_x2": 436.601, "r_y2": 285.669, "r_x3": 417.234, "r_y3": 285.669, "coord_origin": "TOPLEFT"}, "text": ", and", "orig": ", and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 139, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 439.092, "r_y0": 294.078, "r_x1": 516.561, "r_y1": 294.078, "r_x2": 516.561, "r_y2": 285.49, "r_x3": 439.092, "r_y3": 285.49, "coord_origin": "TOPLEFT"}, "text": "Cell BBox Decoder", "orig": "Cell BBox Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 140, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 516.561, "r_y0": 294.221, "r_x1": 519.052, "r_y1": 294.221, "r_x2": 519.052, "r_y2": 285.669, "r_x3": 516.561, "r_y3": 285.669, "coord_origin": "TOPLEFT"}, "text": ".", "orig": ".", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 1, "label": "text", "bbox": {"l": 308.862, "t": 297.34, "r": 545.115, "b": 413.876, "coord_origin": "TOPLEFT"}, "confidence": 0.9862009882926941, "cells": [{"index": 141, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 306.296, "r_x1": 400.866, "r_y1": 306.296, "r_x2": 400.866, "r_y2": 297.34, "r_x3": 320.817, "r_y3": 297.34, "coord_origin": "TOPLEFT"}, "text": "Structure Decoder.", "orig": "Structure Decoder.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 142, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 403.914, "r_y0": 306.28, "r_x1": 545.114, "r_y1": 306.28, "r_x2": 545.114, "r_y2": 297.728, "r_x3": 403.914, "r_y3": 297.728, "coord_origin": "TOPLEFT"}, "text": "The transformer architecture of this", "orig": "The transformer architecture of this", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 143, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 318.235, "r_x1": 517.529, "r_y1": 318.235, "r_x2": 517.529, "r_y2": 309.683, "r_x3": 308.862, "r_y3": 309.683, "coord_origin": "TOPLEFT"}, "text": "component is based on the work proposed in [31].", "orig": "component is based on the work proposed in [31].", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 144, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 524.094, "r_y0": 318.235, "r_x1": 545.115, "r_y1": 318.235, "r_x2": 545.115, "r_y2": 309.683, "r_x3": 524.094, "r_y3": 309.683, "coord_origin": "TOPLEFT"}, "text": "After", "orig": "After", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 145, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 330.19, "r_x1": 432.358, "r_y1": 330.19, "r_x2": 432.358, "r_y2": 321.638, "r_x3": 308.862, "r_y3": 321.638, "coord_origin": "TOPLEFT"}, "text": "extensive experimentation, the", "orig": "extensive experimentation, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 146, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 435.82, "r_y0": 330.047, "r_x1": 510.29, "r_y1": 330.047, "r_x2": 510.29, "r_y2": 321.459, "r_x3": 435.82, "r_y3": 321.459, "coord_origin": "TOPLEFT"}, "text": "Structure Decoder", "orig": "Structure Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 147, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 513.978, "r_y0": 330.19, "r_x1": 520.623, "r_y1": 330.19, "r_x2": 520.623, "r_y2": 321.638, "r_x3": 513.978, "r_y3": 321.638, "coord_origin": "TOPLEFT"}, "text": "is", "orig": "is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 148, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 524.08, "r_y0": 330.19, "r_x1": 545.111, "r_y1": 330.19, "r_x2": 545.111, "r_y2": 321.638, "r_x3": 524.08, "r_y3": 321.638, "coord_origin": "TOPLEFT"}, "text": "mod-", "orig": "mod-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 149, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 342.145, "r_x1": 545.115, "r_y1": 342.145, "r_x2": 545.115, "r_y2": 333.593, "r_x3": 308.862, "r_y3": 333.593, "coord_origin": "TOPLEFT"}, "text": "eled as a transformer encoder with two encoder layers and", "orig": "eled as a transformer encoder with two encoder layers and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 150, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 354.1, "r_x1": 545.115, "r_y1": 354.1, "r_x2": 545.115, "r_y2": 345.548, "r_x3": 308.862, "r_y3": 345.548, "coord_origin": "TOPLEFT"}, "text": "a transformer decoder made from a stack of 4 decoder lay-", "orig": "a transformer decoder made from a stack of 4 decoder lay-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 151, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 366.056, "r_x1": 545.115, "r_y1": 366.056, "r_x2": 545.115, "r_y2": 357.504, "r_x3": 308.862, "r_y3": 357.504, "coord_origin": "TOPLEFT"}, "text": "ers that comprise mainly of multi-head attention and feed", "orig": "ers that comprise mainly of multi-head attention and feed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 152, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 378.011, "r_x1": 370.391, "r_y1": 378.011, "r_x2": 370.391, "r_y2": 369.459, "r_x3": 308.862, "r_y3": 369.459, "coord_origin": "TOPLEFT"}, "text": "forward layers.", "orig": "forward layers.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 153, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 377.445, "r_y0": 378.011, "r_x1": 545.115, "r_y1": 378.011, "r_x2": 545.115, "r_y2": 369.459, "r_x3": 377.445, "r_y3": 369.459, "coord_origin": "TOPLEFT"}, "text": "This configuration uses fewer layers and", "orig": "This configuration uses fewer layers and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 154, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 389.966, "r_x1": 545.115, "r_y1": 389.966, "r_x2": 545.115, "r_y2": 381.414, "r_x3": 308.862, "r_y3": 381.414, "coord_origin": "TOPLEFT"}, "text": "heads in comparison to networks applied to other problems", "orig": "heads in comparison to networks applied to other problems", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 155, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 401.921, "r_x1": 326.566, "r_y1": 401.921, "r_x2": 326.566, "r_y2": 393.369, "r_x3": 308.862, "r_y3": 393.369, "coord_origin": "TOPLEFT"}, "text": "(e.g.", "orig": "(e.g.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 156, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 331.069, "r_y0": 401.921, "r_x1": 545.115, "r_y1": 401.921, "r_x2": 545.115, "r_y2": 393.369, "r_x3": 331.069, "r_y3": 393.369, "coord_origin": "TOPLEFT"}, "text": "'Scene Understanding', 'Image Captioning'), some-", "orig": "'Scene Understanding', 'Image Captioning'), some-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 157, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 413.876, "r_x1": 528.019, "r_y1": 413.876, "r_x2": 528.019, "r_y2": 405.324, "r_x3": 308.862, "r_y3": 405.324, "coord_origin": "TOPLEFT"}, "text": "thing which we relate to the simplicity of table images.", "orig": "thing which we relate to the simplicity of table images.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 3, "label": "text", "bbox": {"l": 308.862, "t": 417.383, "r": 545.115, "b": 545.487, "coord_origin": "TOPLEFT"}, "confidence": 0.9851906895637512, "cells": [{"index": 158, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 425.935, "r_x1": 336.309, "r_y1": 425.935, "r_x2": 336.309, "r_y2": 417.383, "r_x3": 320.817, "r_y3": 417.383, "coord_origin": "TOPLEFT"}, "text": "The", "orig": "The", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 159, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 341.579, "r_y0": 425.935, "r_x1": 388.055, "r_y1": 425.935, "r_x2": 388.055, "r_y2": 417.383, "r_x3": 341.579, "r_y3": 417.383, "coord_origin": "TOPLEFT"}, "text": "transformer", "orig": "transformer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 160, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 393.325, "r_y0": 425.935, "r_x1": 424.856, "r_y1": 425.935, "r_x2": 424.856, "r_y2": 417.383, "r_x3": 393.325, "r_y3": 417.383, "coord_origin": "TOPLEFT"}, "text": "encoder", "orig": "encoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 161, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 430.117, "r_y0": 425.935, "r_x1": 462.356, "r_y1": 425.935, "r_x2": 462.356, "r_y2": 417.383, "r_x3": 430.117, "r_y3": 417.383, "coord_origin": "TOPLEFT"}, "text": "receives", "orig": "receives", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 162, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 467.626, "r_y0": 425.935, "r_x1": 477.031, "r_y1": 425.935, "r_x2": 477.031, "r_y2": 417.383, "r_x3": 467.626, "r_y3": 417.383, "coord_origin": "TOPLEFT"}, "text": "an", "orig": "an", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 163, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 482.301, "r_y0": 425.935, "r_x1": 515.496, "r_y1": 425.935, "r_x2": 515.496, "r_y2": 417.383, "r_x3": 482.301, "r_y3": 417.383, "coord_origin": "TOPLEFT"}, "text": "encoded", "orig": "encoded", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 164, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 520.766, "r_y0": 425.935, "r_x1": 545.115, "r_y1": 425.935, "r_x2": 545.115, "r_y2": 417.383, "r_x3": 520.766, "r_y3": 417.383, "coord_origin": "TOPLEFT"}, "text": "image", "orig": "image", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 165, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 437.89, "r_x1": 343.721, "r_y1": 437.89, "r_x2": 343.721, "r_y2": 429.338, "r_x3": 308.862, "r_y3": 429.338, "coord_origin": "TOPLEFT"}, "text": "from the", "orig": "from the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 166, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 347.038, "r_y0": 437.747, "r_x1": 446.455, "r_y1": 437.747, "r_x2": 446.455, "r_y2": 429.159, "r_x3": 347.038, "r_y3": 429.159, "coord_origin": "TOPLEFT"}, "text": "CNN Backbone Network", "orig": "CNN Backbone Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 167, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 449.94, "r_y0": 437.89, "r_x1": 545.113, "r_y1": 437.89, "r_x2": 545.113, "r_y2": 429.338, "r_x3": 449.94, "r_y3": 429.338, "coord_origin": "TOPLEFT"}, "text": "and refines it through a", "orig": "and refines it through a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 168, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 449.845, "r_x1": 545.115, "r_y1": 449.845, "r_x2": 545.115, "r_y2": 441.293, "r_x3": 308.862, "r_y3": 441.293, "coord_origin": "TOPLEFT"}, "text": "multi-head dot-product attention layer, followed by a Feed", "orig": "multi-head dot-product attention layer, followed by a Feed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 169, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 461.8, "r_x1": 384.149, "r_y1": 461.8, "r_x2": 384.149, "r_y2": 453.248, "r_x3": 308.862, "r_y3": 453.248, "coord_origin": "TOPLEFT"}, "text": "Forward Network.", "orig": "Forward Network.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 170, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 393.375, "r_y0": 461.8, "r_x1": 459.616, "r_y1": 461.8, "r_x2": 459.616, "r_y2": 453.248, "r_x3": 393.375, "r_y3": 453.248, "coord_origin": "TOPLEFT"}, "text": "During training,", "orig": "During training,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 171, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 464.667, "r_y0": 461.8, "r_x1": 476.841, "r_y1": 461.8, "r_x2": 476.841, "r_y2": 453.248, "r_x3": 464.667, "r_y3": 453.248, "coord_origin": "TOPLEFT"}, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 172, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 481.374, "r_y0": 461.8, "r_x1": 527.85, "r_y1": 461.8, "r_x2": 527.85, "r_y2": 453.248, "r_x3": 481.374, "r_y3": 453.248, "coord_origin": "TOPLEFT"}, "text": "transformer", "orig": "transformer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 173, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 532.393, "r_y0": 461.8, "r_x1": 545.115, "r_y1": 461.8, "r_x2": 545.115, "r_y2": 453.248, "r_x3": 532.393, "r_y3": 453.248, "coord_origin": "TOPLEFT"}, "text": "de-", "orig": "de-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 174, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 473.756, "r_x1": 545.115, "r_y1": 473.756, "r_x2": 545.115, "r_y2": 465.204, "r_x3": 308.862, "r_y3": 465.204, "coord_origin": "TOPLEFT"}, "text": "coder receives as input the output feature produced by the", "orig": "coder receives as input the output feature produced by the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 175, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 485.711, "r_x1": 545.115, "r_y1": 485.711, "r_x2": 545.115, "r_y2": 477.159, "r_x3": 308.862, "r_y3": 477.159, "coord_origin": "TOPLEFT"}, "text": "transformer encoder, and the tokenized input of the HTML", "orig": "transformer encoder, and the tokenized input of the HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 176, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 497.666, "r_x1": 545.115, "r_y1": 497.666, "r_x2": 545.115, "r_y2": 489.114, "r_x3": 308.862, "r_y3": 489.114, "coord_origin": "TOPLEFT"}, "text": "ground-truth tags. Using a stack of multi-head attention lay-", "orig": "ground-truth tags. Using a stack of multi-head attention lay-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 177, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 509.621, "r_x1": 545.115, "r_y1": 509.621, "r_x2": 545.115, "r_y2": 501.069, "r_x3": 308.862, "r_y3": 501.069, "coord_origin": "TOPLEFT"}, "text": "ers, different aspects of the tag sequence could be inferred.", "orig": "ers, different aspects of the tag sequence could be inferred.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 178, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 521.576, "r_x1": 545.115, "r_y1": 521.576, "r_x2": 545.115, "r_y2": 513.024, "r_x3": 308.862, "r_y3": 513.024, "coord_origin": "TOPLEFT"}, "text": "This is achieved by each attention head on a layer operating", "orig": "This is achieved by each attention head on a layer operating", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 179, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 533.5319999999999, "r_x1": 545.115, "r_y1": 533.5319999999999, "r_x2": 545.115, "r_y2": 524.98, "r_x3": 308.862, "r_y3": 524.98, "coord_origin": "TOPLEFT"}, "text": "in a different subspace, and then combining altogether their", "orig": "in a different subspace, and then combining altogether their", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 180, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 545.487, "r_x1": 369.733, "r_y1": 545.487, "r_x2": 369.733, "r_y2": 536.935, "r_x3": 308.862, "r_y3": 536.935, "coord_origin": "TOPLEFT"}, "text": "attention score.", "orig": "attention score.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 0, "label": "text", "bbox": {"l": 308.862, "t": 548.605, "r": 545.115, "b": 653.187, "coord_origin": "TOPLEFT"}, "confidence": 0.9869195818901062, "cells": [{"index": 181, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 557.561, "r_x1": 404.762, "r_y1": 557.561, "r_x2": 404.762, "r_y2": 548.605, "r_x3": 320.817, "r_y3": 548.605, "coord_origin": "TOPLEFT"}, "text": "Cell BBox Decoder.", "orig": "Cell BBox Decoder.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 182, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 410.341, "r_y0": 557.545, "r_x1": 545.115, "r_y1": 557.545, "r_x2": 545.115, "r_y2": 548.9929999999999, "r_x3": 410.341, "r_y3": 548.9929999999999, "coord_origin": "TOPLEFT"}, "text": "Our architecture allows to simul-", "orig": "Our architecture allows to simul-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 183, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 569.501, "r_x1": 545.115, "r_y1": 569.501, "r_x2": 545.115, "r_y2": 560.9490000000001, "r_x3": 308.862, "r_y3": 560.9490000000001, "coord_origin": "TOPLEFT"}, "text": "taneously predict HTML tags and bounding boxes for each", "orig": "taneously predict HTML tags and bounding boxes for each", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 184, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 581.456, "r_x1": 545.115, "r_y1": 581.456, "r_x2": 545.115, "r_y2": 572.904, "r_x3": 308.862, "r_y3": 572.904, "coord_origin": "TOPLEFT"}, "text": "table cell without the need of a separate object detector end", "orig": "table cell without the need of a separate object detector end", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 185, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 593.4110000000001, "r_x1": 336.458, "r_y1": 593.4110000000001, "r_x2": 336.458, "r_y2": 584.859, "r_x3": 308.862, "r_y3": 584.859, "coord_origin": "TOPLEFT"}, "text": "to end.", "orig": "to end.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 186, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 340.971, "r_y0": 593.4110000000001, "r_x1": 545.115, "r_y1": 593.4110000000001, "r_x2": 545.115, "r_y2": 584.859, "r_x3": 340.971, "r_y3": 584.859, "coord_origin": "TOPLEFT"}, "text": "This approach is inspired by DETR [1] which em-", "orig": "This approach is inspired by DETR [1] which em-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 187, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 605.366, "r_x1": 545.115, "r_y1": 605.366, "r_x2": 545.115, "r_y2": 596.814, "r_x3": 308.862, "r_y3": 596.814, "coord_origin": "TOPLEFT"}, "text": "ploys a Transformer Encoder, and Decoder that looks for", "orig": "ploys a Transformer Encoder, and Decoder that looks for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 188, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 617.321, "r_x1": 545.115, "r_y1": 617.321, "r_x2": 545.115, "r_y2": 608.769, "r_x3": 308.862, "r_y3": 608.769, "coord_origin": "TOPLEFT"}, "text": "a specific number of object queries (potential object detec-", "orig": "a specific number of object queries (potential object detec-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 189, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 629.2760000000001, "r_x1": 545.115, "r_y1": 629.2760000000001, "r_x2": 545.115, "r_y2": 620.7239999999999, "r_x3": 308.862, "r_y3": 620.7239999999999, "coord_origin": "TOPLEFT"}, "text": "tions). As our model utilizes a transformer architecture, the", "orig": "tions). As our model utilizes a transformer architecture, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 190, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 641.232, "r_x1": 381.679, "r_y1": 641.232, "r_x2": 381.679, "r_y2": 632.6800000000001, "r_x3": 308.862, "r_y3": 632.6800000000001, "coord_origin": "TOPLEFT"}, "text": "hidden state of the", "orig": "hidden state of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 191, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 383.997, "r_y0": 641.068, "r_x1": 391.746, "r_y1": 641.068, "r_x2": 391.746, "r_y2": 632.362, "r_x3": 383.997, "r_y3": 632.362, "coord_origin": "TOPLEFT"}, "text": "<", "orig": "<", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 192, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 391.746, "r_y0": 641.232, "r_x1": 399.497, "r_y1": 641.232, "r_x2": 399.497, "r_y2": 632.6800000000001, "r_x3": 391.746, "r_y3": 632.6800000000001, "coord_origin": "TOPLEFT"}, "text": "td", "orig": "td", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 193, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 399.497, "r_y0": 641.068, "r_x1": 407.246, "r_y1": 641.068, "r_x2": 407.246, "r_y2": 632.362, "r_x3": 399.497, "r_y3": 632.362, "coord_origin": "TOPLEFT"}, "text": ">", "orig": ">", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 194, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 407.246, "r_y0": 641.232, "r_x1": 432.91, "r_y1": 641.232, "r_x2": 432.91, "r_y2": 632.6800000000001, "r_x3": 407.246, "r_y3": 632.6800000000001, "coord_origin": "TOPLEFT"}, "text": "' and '", "orig": "' and '", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 195, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 432.908, "r_y0": 641.068, "r_x1": 440.657, "r_y1": 641.068, "r_x2": 440.657, "r_y2": 632.362, "r_x3": 432.908, "r_y3": 632.362, "coord_origin": "TOPLEFT"}, "text": "<", "orig": "<", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 196, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 440.657, "r_y0": 641.232, "r_x1": 545.115, "r_y1": 641.232, "r_x2": 545.115, "r_y2": 632.6800000000001, "r_x3": 440.657, "r_y3": 632.6800000000001, "coord_origin": "TOPLEFT"}, "text": "' HTMLstructure tags be-", "orig": "' HTMLstructure tags be-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 197, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 653.187, "r_x1": 398.964, "r_y1": 653.187, "r_x2": 398.964, "r_y2": 644.635, "r_x3": 308.862, "r_y3": 644.635, "coord_origin": "TOPLEFT"}, "text": "come the object query.", "orig": "come the object query.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 2, "label": "text", "bbox": {"l": 308.862, "t": 656.515, "r": 545.115, "b": 713.066, "coord_origin": "TOPLEFT"}, "confidence": 0.9852352142333984, "cells": [{"index": 198, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 665.246, "r_x1": 444.343, "r_y1": 665.246, "r_x2": 444.343, "r_y2": 656.694, "r_x3": 320.817, "r_y3": 656.694, "coord_origin": "TOPLEFT"}, "text": "The encoding generated by the", "orig": "The encoding generated by the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 199, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 447.006, "r_y0": 665.103, "r_x1": 545.108, "r_y1": 665.103, "r_x2": 545.108, "r_y2": 656.515, "r_x3": 447.006, "r_y3": 656.515, "coord_origin": "TOPLEFT"}, "text": "CNN Backbone Network", "orig": "CNN Backbone Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 200, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 677.201, "r_x1": 545.115, "r_y1": 677.201, "r_x2": 545.115, "r_y2": 668.649, "r_x3": 308.862, "r_y3": 668.649, "coord_origin": "TOPLEFT"}, "text": "along with the features acquired for every data cell from the", "orig": "along with the features acquired for every data cell from the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 201, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 689.156, "r_x1": 545.115, "r_y1": 689.156, "r_x2": 545.115, "r_y2": 680.604, "r_x3": 308.862, "r_y3": 680.604, "coord_origin": "TOPLEFT"}, "text": "Transformer Decoder are then passed to the attention net-", "orig": "Transformer Decoder are then passed to the attention net-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 202, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 701.111, "r_x1": 545.115, "r_y1": 701.111, "r_x2": 545.115, "r_y2": 692.559, "r_x3": 308.862, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "work. The attention network takes both inputs and learns to", "orig": "work. The attention network takes both inputs and learns to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 203, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 713.066, "r_x1": 470.425, "r_y1": 713.066, "r_x2": 470.425, "r_y2": 704.514, "r_x3": 308.862, "r_y3": 704.514, "coord_origin": "TOPLEFT"}, "text": "provide an attention weighted encoding.", "orig": "provide an attention weighted encoding.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 204, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 474.63, "r_y0": 713.066, "r_x1": 545.115, "r_y1": 713.066, "r_x2": 545.115, "r_y2": 704.514, "r_x3": 474.63, "r_y3": 704.514, "coord_origin": "TOPLEFT"}, "text": "This weighted at-", "orig": "This weighted at-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 9, "label": "page_footer", "bbox": {"l": 295.121, "t": 734.402, "r": 300.102, "b": 742.954, "coord_origin": "TOPLEFT"}, "confidence": 0.8719564080238342, "cells": [{"index": 205, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 295.121, "r_y0": 742.954, "r_x1": 300.102, "r_y1": 742.954, "r_x2": 300.102, "r_y2": 734.402, "r_x3": 295.121, "r_y3": 734.402, "coord_origin": "TOPLEFT"}, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}]}, "tablestructure": {"table_map": {}}, "figures_classification": null, "equations_prediction": null, "vlm_response": null}, "assembled": {"elements": [{"label": "picture", "id": 7, "page_no": 4, "cluster": {"id": 7, "label": "picture", "bbox": {"l": 74.30525970458984, "t": 77.91120147705078, "r": 519.9801025390625, "b": 183.70150756835938, "coord_origin": "TOPLEFT"}, "confidence": 0.9296807646751404, "cells": [{"index": 0, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 81.688, "r_y0": 125.61699999999996, "r_x1": 84.524, "r_y1": 125.61699999999996, "r_x2": 84.524, "r_y2": 122.481, "r_x3": 81.688, "r_y3": 122.481, "coord_origin": "TOPLEFT"}, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 86.413, "r_y0": 125.61699999999996, "r_x1": 93.026, "r_y1": 125.61699999999996, "r_x2": 93.026, "r_y2": 122.481, "r_x3": 86.413, "r_y3": 122.481, "coord_origin": "TOPLEFT"}, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 102.505, "r_y0": 118.42999999999995, "r_x1": 115.346, "r_y1": 118.42999999999995, "r_x2": 115.346, "r_y2": 115.293, "r_x3": 102.505, "r_y3": 115.293, "coord_origin": "TOPLEFT"}, "text": "Amount", "orig": "Amount", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 82.14, "r_y0": 118.39200000000005, "r_x1": 93.292, "r_y1": 118.39200000000005, "r_x2": 93.292, "r_y2": 115.25599999999997, "r_x3": 82.14, "r_y3": 115.25599999999997, "coord_origin": "TOPLEFT"}, "text": "Names", "orig": "Names", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 96.748, "r_y0": 125.61699999999996, "r_x1": 104.312, "r_y1": 125.61699999999996, "r_x2": 104.312, "r_y2": 122.481, "r_x3": 96.748, "r_y3": 122.481, "coord_origin": "TOPLEFT"}, "text": "1000", "orig": "1000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 96.748, "r_y0": 130.92100000000005, "r_x1": 102.421, "r_y1": 130.92100000000005, "r_x2": 102.421, "r_y2": 127.78499999999997, "r_x3": 96.748, "r_y3": 127.78499999999997, "coord_origin": "TOPLEFT"}, "text": "500", "orig": "500", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 96.748, "r_y0": 136.63300000000004, "r_x1": 104.312, "r_y1": 136.63300000000004, "r_x2": 104.312, "r_y2": 133.49699999999996, "r_x3": 96.748, "r_y3": 133.49699999999996, "coord_origin": "TOPLEFT"}, "text": "3500", "orig": "3500", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 96.748, "r_y0": 142.34500000000003, "r_x1": 102.421, "r_y1": 142.34500000000003, "r_x2": 102.421, "r_y2": 139.20899999999995, "r_x3": 96.748, "r_y3": 139.20899999999995, "coord_origin": "TOPLEFT"}, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 110.661, "r_y0": 125.61699999999996, "r_x1": 116.144, "r_y1": 125.61699999999996, "r_x2": 116.144, "r_y2": 122.481, "r_x3": 110.661, "r_y3": 122.481, "coord_origin": "TOPLEFT"}, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 110.661, "r_y0": 130.92100000000005, "r_x1": 116.144, "r_y1": 130.92100000000005, "r_x2": 116.144, "r_y2": 127.78499999999997, "r_x3": 110.661, "r_y3": 127.78499999999997, "coord_origin": "TOPLEFT"}, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 110.661, "r_y0": 136.63300000000004, "r_x1": 116.144, "r_y1": 136.63300000000004, "r_x2": 116.144, "r_y2": 133.49699999999996, "r_x3": 110.661, "r_y3": 133.49699999999996, "coord_origin": "TOPLEFT"}, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 110.661, "r_y0": 142.34500000000003, "r_x1": 116.144, "r_y1": 142.34500000000003, "r_x2": 116.144, "r_y2": 139.20899999999995, "r_x3": 110.661, "r_y3": 139.20899999999995, "coord_origin": "TOPLEFT"}, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 81.688, "r_y0": 130.92100000000005, "r_x1": 84.524, "r_y1": 130.92100000000005, "r_x2": 84.524, "r_y2": 127.78499999999997, "r_x3": 81.688, "r_y3": 127.78499999999997, "coord_origin": "TOPLEFT"}, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 86.413, "r_y0": 130.92100000000005, "r_x1": 93.026, "r_y1": 130.92100000000005, "r_x2": 93.026, "r_y2": 127.78499999999997, "r_x3": 86.413, "r_y3": 127.78499999999997, "coord_origin": "TOPLEFT"}, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 81.688, "r_y0": 136.63300000000004, "r_x1": 84.524, "r_y1": 136.63300000000004, "r_x2": 84.524, "r_y2": 133.49699999999996, "r_x3": 81.688, "r_y3": 133.49699999999996, "coord_origin": "TOPLEFT"}, "text": "3.", "orig": "3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 86.413, "r_y0": 136.63300000000004, "r_x1": 93.026, "r_y1": 136.63300000000004, "r_x2": 93.026, "r_y2": 133.49699999999996, "r_x3": 86.413, "r_y3": 133.49699999999996, "coord_origin": "TOPLEFT"}, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 81.688, "r_y0": 142.34500000000003, "r_x1": 84.524, "r_y1": 142.34500000000003, "r_x2": 84.524, "r_y2": 139.20899999999995, "r_x3": 81.688, "r_y3": 139.20899999999995, "coord_origin": "TOPLEFT"}, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 86.413, "r_y0": 142.34500000000003, "r_x1": 93.026, "r_y1": 142.34500000000003, "r_x2": 93.026, "r_y2": 139.20899999999995, "r_x3": 86.413, "r_y3": 139.20899999999995, "coord_origin": "TOPLEFT"}, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 88.084, "r_y0": 96.21699999999998, "r_x1": 113.936, "r_y1": 96.21699999999998, "r_x2": 113.936, "r_y2": 90.57100000000003, "r_x3": 88.084, "r_y3": 90.57100000000003, "coord_origin": "TOPLEFT"}, "text": "Extracted", "orig": "Extracted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 19, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 82.81, "r_y0": 103.35699999999997, "r_x1": 119.212, "r_y1": 103.35699999999997, "r_x2": 119.212, "r_y2": 97.71100000000001, "r_x3": 82.81, "r_y3": 97.71100000000001, "coord_origin": "TOPLEFT"}, "text": "Table Images", "orig": "Table Images", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 20, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 143.942, "r_y0": 106.322, "r_x1": 180.011, "r_y1": 106.322, "r_x2": 180.011, "r_y2": 100.67600000000004, "r_x3": 143.942, "r_y3": 100.67600000000004, "coord_origin": "TOPLEFT"}, "text": "Standardized", "orig": "Standardized", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 21, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.941, "r_y0": 113.46199999999999, "r_x1": 172.012, "r_y1": 113.46199999999999, "r_x2": 172.012, "r_y2": 107.81600000000003, "r_x3": 151.941, "r_y3": 107.81600000000003, "coord_origin": "TOPLEFT"}, "text": "Images", "orig": "Images", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 22, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 251.769, "r_y0": 86.64999999999998, "r_x1": 266.396, "r_y1": 86.64999999999998, "r_x2": 266.396, "r_y2": 81.00400000000002, "r_x3": 251.769, "r_y3": 81.00400000000002, "coord_origin": "TOPLEFT"}, "text": "BBox", "orig": "BBox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 23, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 247.516, "r_y0": 91.75, "r_x1": 270.65, "r_y1": 91.75, "r_x2": 270.65, "r_y2": 86.10400000000004, "r_x3": 247.516, "r_y3": 86.10400000000004, "coord_origin": "TOPLEFT"}, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 24, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 331.037, "r_y0": 84.279, "r_x1": 352.126, "r_y1": 84.279, "r_x2": 352.126, "r_y2": 78.63300000000004, "r_x3": 331.037, "r_y3": 78.63300000000004, "coord_origin": "TOPLEFT"}, "text": "BBoxes", "orig": "BBoxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 25, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 390.564, "r_y0": 101.75199999999995, "r_x1": 431.726, "r_y1": 101.75199999999995, "r_x2": 431.726, "r_y2": 96.106, "r_x3": 390.564, "r_y3": 96.106, "coord_origin": "TOPLEFT"}, "text": "BBoxes can be", "orig": "BBoxes can be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 26, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 386.824, "r_y0": 107.87199999999996, "r_x1": 435.47, "r_y1": 107.87199999999996, "r_x2": 435.47, "r_y2": 102.226, "r_x3": 386.824, "r_y3": 102.226, "coord_origin": "TOPLEFT"}, "text": "traced back to the", "orig": "traced back to the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 27, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 388.696, "r_y0": 113.99199999999996, "r_x1": 433.603, "r_y1": 113.99199999999996, "r_x2": 433.603, "r_y2": 108.346, "r_x3": 388.696, "r_y3": 108.346, "coord_origin": "TOPLEFT"}, "text": "original image to", "orig": "original image to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 28, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 391.078, "r_y0": 120.11199999999997, "r_x1": 431.225, "r_y1": 120.11199999999997, "r_x2": 431.225, "r_y2": 114.46600000000001, "r_x3": 391.078, "r_y3": 114.46600000000001, "coord_origin": "TOPLEFT"}, "text": "extract content", "orig": "extract content", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 29, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 431.227, "r_y0": 157.40499999999997, "r_x1": 498.821, "r_y1": 157.40499999999997, "r_x2": 498.821, "r_y2": 151.75900000000001, "r_x3": 431.227, "r_y3": 151.75900000000001, "coord_origin": "TOPLEFT"}, "text": "Structure Tags sequence", "orig": "Structure Tags sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 30, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 431.174, "r_y0": 163.52499999999998, "r_x1": 498.878, "r_y1": 163.52499999999998, "r_x2": 498.878, "r_y2": 157.87900000000002, "r_x3": 431.174, "r_y3": 157.87900000000002, "coord_origin": "TOPLEFT"}, "text": "provide full description of", "orig": "provide full description of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 440.529, "r_y0": 169.64499999999998, "r_x1": 489.518, "r_y1": 169.64499999999998, "r_x2": 489.518, "r_y2": 163.99900000000002, "r_x3": 440.529, "r_y3": 163.99900000000002, "coord_origin": "TOPLEFT"}, "text": "the table structure", "orig": "the table structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.375, "r_y0": 183.97299999999996, "r_x1": 367.723, "r_y1": 183.97299999999996, "r_x2": 367.723, "r_y2": 178.327, "r_x3": 328.375, "r_y3": 178.327, "coord_origin": "TOPLEFT"}, "text": "Structure Tags", "orig": "Structure Tags", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 331.845, "r_y0": 129.62800000000004, "r_x1": 373.68, "r_y1": 129.62800000000004, "r_x2": 373.68, "r_y2": 123.98199999999997, "r_x3": 331.845, "r_y3": 123.98199999999997, "coord_origin": "TOPLEFT"}, "text": "BBoxes in sync", "orig": "BBoxes in sync", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 331.845, "r_y0": 134.72799999999995, "r_x1": 381.178, "r_y1": 134.72799999999995, "r_x2": 381.178, "r_y2": 129.082, "r_x3": 331.845, "r_y3": 129.082, "coord_origin": "TOPLEFT"}, "text": "with tag sequence", "orig": "with tag sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 196.626, "r_y0": 93.83600000000001, "r_x1": 219.423, "r_y1": 93.83600000000001, "r_x2": 219.423, "r_y2": 88.19000000000005, "r_x3": 196.626, "r_y3": 88.19000000000005, "coord_origin": "TOPLEFT"}, "text": "Encoder", "orig": "Encoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 246.668, "r_y0": 135.21400000000006, "r_x1": 271.499, "r_y1": 135.21400000000006, "r_x2": 271.499, "r_y2": 129.56799999999998, "r_x3": 246.668, "r_y3": 129.56799999999998, "coord_origin": "TOPLEFT"}, "text": "Structure", "orig": "Structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 247.516, "r_y0": 140.31399999999996, "r_x1": 270.65, "r_y1": 140.31399999999996, "r_x2": 270.65, "r_y2": 134.668, "r_x3": 247.516, "r_y3": 134.668, "coord_origin": "TOPLEFT"}, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 330.631, "r_y0": 94.73900000000003, "r_x1": 365.553, "r_y1": 94.73900000000003, "r_x2": 365.553, "r_y2": 89.09299999999996, "r_x3": 330.631, "r_y3": 89.09299999999996, "coord_origin": "TOPLEFT"}, "text": "[x1, y2, x2, y2]", "orig": "[x1, y2, x2, y2]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 330.631, "r_y0": 102.899, "r_x1": 370.227, "r_y1": 102.899, "r_x2": 370.227, "r_y2": 97.25300000000004, "r_x3": 330.631, "r_y3": 97.25300000000004, "coord_origin": "TOPLEFT"}, "text": "[x1', y2', x2', y2']", "orig": "[x1', y2', x2', y2']", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 330.631, "r_y0": 111.05899999999997, "r_x1": 374.512, "r_y1": 111.05899999999997, "r_x2": 374.512, "r_y2": 105.41300000000001, "r_x3": 330.631, "r_y3": 105.41300000000001, "coord_origin": "TOPLEFT"}, "text": "[x1'', y2'', x2'', y2'']", "orig": "[x1'', y2'', x2'', y2'']", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 330.631, "r_y0": 119.21900000000005, "r_x1": 335.732, "r_y1": 119.21900000000005, "r_x2": 335.732, "r_y2": 113.57299999999998, "r_x3": 330.631, "r_y3": 113.57299999999998, "coord_origin": "TOPLEFT"}, "text": "...", "orig": "...", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 322.306, "r_y0": 146.558, "r_x1": 335.06, "r_y1": 146.558, "r_x2": 335.06, "r_y2": 141.85400000000004, "r_x3": 322.306, "r_y3": 141.85400000000004, "coord_origin": "TOPLEFT"}, "text": "<TR>", "orig": "<TR>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 322.306, "r_y0": 153.69799999999998, "r_x1": 421.588, "r_y1": 153.69799999999998, "r_x2": 421.588, "r_y2": 148.99400000000003, "r_x3": 322.306, "r_y3": 148.99400000000003, "coord_origin": "TOPLEFT"}, "text": "<TD> 1 </TD><TD colspan=\"2\"> 2 </TD>", "orig": "<TD> 1 </TD><TD colspan=\"2\"> 2 </TD>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 322.306, "r_y0": 160.83799999999997, "r_x1": 349.23, "r_y1": 160.83799999999997, "r_x2": 349.23, "r_y2": 156.13400000000001, "r_x3": 322.306, "r_y3": 156.13400000000001, "coord_origin": "TOPLEFT"}, "text": "</TR><TR>", "orig": "</TR><TR>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 322.306, "r_y0": 167.97799999999995, "r_x1": 374.737, "r_y1": 167.97799999999995, "r_x2": 374.737, "r_y2": 163.274, "r_x3": 322.306, "r_y3": 163.274, "coord_origin": "TOPLEFT"}, "text": "<TD> 3 </TD><TD>...", "orig": "<TD> 3 </TD><TD>...", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 322.306, "r_y0": 175.11800000000005, "r_x1": 326.557, "r_y1": 175.11800000000005, "r_x2": 326.557, "r_y2": 170.414, "r_x3": 322.306, "r_y3": 170.414, "coord_origin": "TOPLEFT"}, "text": "...", "orig": "...", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 323.511, "r_y0": 95.38900000000001, "r_x1": 326.914, "r_y1": 95.38900000000001, "r_x2": 326.914, "r_y2": 89.74300000000005, "r_x3": 323.511, "r_y3": 89.74300000000005, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 48, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 323.715, "r_y0": 103.50800000000004, "r_x1": 327.118, "r_y1": 103.50800000000004, "r_x2": 327.118, "r_y2": 97.86199999999997, "r_x3": 323.715, "r_y3": 97.86199999999997, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 49, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 323.715, "r_y0": 111.70899999999995, "r_x1": 327.118, "r_y1": 111.70899999999995, "r_x2": 327.118, "r_y2": 106.06299999999999, "r_x3": 323.715, "r_y3": 106.06299999999999, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 50, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 454.464, "r_y0": 110.26499999999999, "r_x1": 457.867, "r_y1": 110.26499999999999, "r_x2": 457.867, "r_y2": 104.61900000000003, "r_x3": 454.464, "r_y3": 104.61900000000003, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 51, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 493.326, "r_y0": 96.81500000000005, "r_x1": 496.729, "r_y1": 96.81500000000005, "r_x2": 496.729, "r_y2": 91.16899999999998, "r_x3": 493.326, "r_y3": 91.16899999999998, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 52, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 454.083, "r_y0": 96.28800000000001, "r_x1": 457.486, "r_y1": 96.28800000000001, "r_x2": 457.486, "r_y2": 90.64200000000005, "r_x3": 454.083, "r_y3": 90.64200000000005, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": [{"id": 11, "label": "text", "bbox": {"l": 81.688, "t": 122.481, "r": 84.524, "b": 125.61699999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 0, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 81.688, "r_y0": 125.61699999999996, "r_x1": 84.524, "r_y1": 125.61699999999996, "r_x2": 84.524, "r_y2": 122.481, "r_x3": 81.688, "r_y3": 122.481, "coord_origin": "TOPLEFT"}, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 12, "label": "text", "bbox": {"l": 86.413, "t": 122.481, "r": 93.026, "b": 125.61699999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 86.413, "r_y0": 125.61699999999996, "r_x1": 93.026, "r_y1": 125.61699999999996, "r_x2": 93.026, "r_y2": 122.481, "r_x3": 86.413, "r_y3": 122.481, "coord_origin": "TOPLEFT"}, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 13, "label": "text", "bbox": {"l": 102.505, "t": 115.293, "r": 115.346, "b": 118.42999999999995, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 102.505, "r_y0": 118.42999999999995, "r_x1": 115.346, "r_y1": 118.42999999999995, "r_x2": 115.346, "r_y2": 115.293, "r_x3": 102.505, "r_y3": 115.293, "coord_origin": "TOPLEFT"}, "text": "Amount", "orig": "Amount", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 14, "label": "text", "bbox": {"l": 82.14, "t": 115.25599999999997, "r": 93.292, "b": 118.39200000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 82.14, "r_y0": 118.39200000000005, "r_x1": 93.292, "r_y1": 118.39200000000005, "r_x2": 93.292, "r_y2": 115.25599999999997, "r_x3": 82.14, "r_y3": 115.25599999999997, "coord_origin": "TOPLEFT"}, "text": "Names", "orig": "Names", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 15, "label": "text", "bbox": {"l": 96.748, "t": 122.481, "r": 104.312, "b": 125.61699999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 96.748, "r_y0": 125.61699999999996, "r_x1": 104.312, "r_y1": 125.61699999999996, "r_x2": 104.312, "r_y2": 122.481, "r_x3": 96.748, "r_y3": 122.481, "coord_origin": "TOPLEFT"}, "text": "1000", "orig": "1000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 16, "label": "text", "bbox": {"l": 96.748, "t": 127.78499999999997, "r": 102.421, "b": 130.92100000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 96.748, "r_y0": 130.92100000000005, "r_x1": 102.421, "r_y1": 130.92100000000005, "r_x2": 102.421, "r_y2": 127.78499999999997, "r_x3": 96.748, "r_y3": 127.78499999999997, "coord_origin": "TOPLEFT"}, "text": "500", "orig": "500", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 17, "label": "text", "bbox": {"l": 96.748, "t": 133.49699999999996, "r": 104.312, "b": 136.63300000000004, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 96.748, "r_y0": 136.63300000000004, "r_x1": 104.312, "r_y1": 136.63300000000004, "r_x2": 104.312, "r_y2": 133.49699999999996, "r_x3": 96.748, "r_y3": 133.49699999999996, "coord_origin": "TOPLEFT"}, "text": "3500", "orig": "3500", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 18, "label": "text", "bbox": {"l": 96.748, "t": 139.20899999999995, "r": 102.421, "b": 142.34500000000003, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 96.748, "r_y0": 142.34500000000003, "r_x1": 102.421, "r_y1": 142.34500000000003, "r_x2": 102.421, "r_y2": 139.20899999999995, "r_x3": 96.748, "r_y3": 139.20899999999995, "coord_origin": "TOPLEFT"}, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 19, "label": "text", "bbox": {"l": 110.661, "t": 122.481, "r": 116.144, "b": 125.61699999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 110.661, "r_y0": 125.61699999999996, "r_x1": 116.144, "r_y1": 125.61699999999996, "r_x2": 116.144, "r_y2": 122.481, "r_x3": 110.661, "r_y3": 122.481, "coord_origin": "TOPLEFT"}, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 20, "label": "text", "bbox": {"l": 110.661, "t": 127.78499999999997, "r": 116.144, "b": 130.92100000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 110.661, "r_y0": 130.92100000000005, "r_x1": 116.144, "r_y1": 130.92100000000005, "r_x2": 116.144, "r_y2": 127.78499999999997, "r_x3": 110.661, "r_y3": 127.78499999999997, "coord_origin": "TOPLEFT"}, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 21, "label": "text", "bbox": {"l": 110.661, "t": 133.49699999999996, "r": 116.144, "b": 136.63300000000004, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 110.661, "r_y0": 136.63300000000004, "r_x1": 116.144, "r_y1": 136.63300000000004, "r_x2": 116.144, "r_y2": 133.49699999999996, "r_x3": 110.661, "r_y3": 133.49699999999996, "coord_origin": "TOPLEFT"}, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 22, "label": "text", "bbox": {"l": 110.661, "t": 139.20899999999995, "r": 116.144, "b": 142.34500000000003, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 110.661, "r_y0": 142.34500000000003, "r_x1": 116.144, "r_y1": 142.34500000000003, "r_x2": 116.144, "r_y2": 139.20899999999995, "r_x3": 110.661, "r_y3": 139.20899999999995, "coord_origin": "TOPLEFT"}, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 23, "label": "text", "bbox": {"l": 81.688, "t": 127.78499999999997, "r": 84.524, "b": 130.92100000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 81.688, "r_y0": 130.92100000000005, "r_x1": 84.524, "r_y1": 130.92100000000005, "r_x2": 84.524, "r_y2": 127.78499999999997, "r_x3": 81.688, "r_y3": 127.78499999999997, "coord_origin": "TOPLEFT"}, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 24, "label": "text", "bbox": {"l": 86.413, "t": 127.78499999999997, "r": 93.026, "b": 130.92100000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 86.413, "r_y0": 130.92100000000005, "r_x1": 93.026, "r_y1": 130.92100000000005, "r_x2": 93.026, "r_y2": 127.78499999999997, "r_x3": 86.413, "r_y3": 127.78499999999997, "coord_origin": "TOPLEFT"}, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 25, "label": "text", "bbox": {"l": 81.688, "t": 133.49699999999996, "r": 84.524, "b": 136.63300000000004, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 81.688, "r_y0": 136.63300000000004, "r_x1": 84.524, "r_y1": 136.63300000000004, "r_x2": 84.524, "r_y2": 133.49699999999996, "r_x3": 81.688, "r_y3": 133.49699999999996, "coord_origin": "TOPLEFT"}, "text": "3.", "orig": "3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 26, "label": "text", "bbox": {"l": 86.413, "t": 133.49699999999996, "r": 93.026, "b": 136.63300000000004, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 86.413, "r_y0": 136.63300000000004, "r_x1": 93.026, "r_y1": 136.63300000000004, "r_x2": 93.026, "r_y2": 133.49699999999996, "r_x3": 86.413, "r_y3": 133.49699999999996, "coord_origin": "TOPLEFT"}, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 27, "label": "text", "bbox": {"l": 81.688, "t": 139.20899999999995, "r": 84.524, "b": 142.34500000000003, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 81.688, "r_y0": 142.34500000000003, "r_x1": 84.524, "r_y1": 142.34500000000003, "r_x2": 84.524, "r_y2": 139.20899999999995, "r_x3": 81.688, "r_y3": 139.20899999999995, "coord_origin": "TOPLEFT"}, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 28, "label": "text", "bbox": {"l": 86.413, "t": 139.20899999999995, "r": 93.026, "b": 142.34500000000003, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 86.413, "r_y0": 142.34500000000003, "r_x1": 93.026, "r_y1": 142.34500000000003, "r_x2": 93.026, "r_y2": 139.20899999999995, "r_x3": 86.413, "r_y3": 139.20899999999995, "coord_origin": "TOPLEFT"}, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 29, "label": "text", "bbox": {"l": 88.084, "t": 90.57100000000003, "r": 113.936, "b": 96.21699999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 88.084, "r_y0": 96.21699999999998, "r_x1": 113.936, "r_y1": 96.21699999999998, "r_x2": 113.936, "r_y2": 90.57100000000003, "r_x3": 88.084, "r_y3": 90.57100000000003, "coord_origin": "TOPLEFT"}, "text": "Extracted", "orig": "Extracted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 30, "label": "text", "bbox": {"l": 82.81, "t": 97.71100000000001, "r": 119.212, "b": 103.35699999999997, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 19, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 82.81, "r_y0": 103.35699999999997, "r_x1": 119.212, "r_y1": 103.35699999999997, "r_x2": 119.212, "r_y2": 97.71100000000001, "r_x3": 82.81, "r_y3": 97.71100000000001, "coord_origin": "TOPLEFT"}, "text": "Table Images", "orig": "Table Images", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 31, "label": "text", "bbox": {"l": 143.942, "t": 100.67600000000004, "r": 180.011, "b": 106.322, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 20, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 143.942, "r_y0": 106.322, "r_x1": 180.011, "r_y1": 106.322, "r_x2": 180.011, "r_y2": 100.67600000000004, "r_x3": 143.942, "r_y3": 100.67600000000004, "coord_origin": "TOPLEFT"}, "text": "Standardized", "orig": "Standardized", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 32, "label": "text", "bbox": {"l": 151.941, "t": 107.81600000000003, "r": 172.012, "b": 113.46199999999999, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 21, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.941, "r_y0": 113.46199999999999, "r_x1": 172.012, "r_y1": 113.46199999999999, "r_x2": 172.012, "r_y2": 107.81600000000003, "r_x3": 151.941, "r_y3": 107.81600000000003, "coord_origin": "TOPLEFT"}, "text": "Images", "orig": "Images", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 33, "label": "text", "bbox": {"l": 251.769, "t": 81.00400000000002, "r": 266.396, "b": 86.64999999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 22, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 251.769, "r_y0": 86.64999999999998, "r_x1": 266.396, "r_y1": 86.64999999999998, "r_x2": 266.396, "r_y2": 81.00400000000002, "r_x3": 251.769, "r_y3": 81.00400000000002, "coord_origin": "TOPLEFT"}, "text": "BBox", "orig": "BBox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 34, "label": "text", "bbox": {"l": 247.516, "t": 86.10400000000004, "r": 270.65, "b": 91.75, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 23, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 247.516, "r_y0": 91.75, "r_x1": 270.65, "r_y1": 91.75, "r_x2": 270.65, "r_y2": 86.10400000000004, "r_x3": 247.516, "r_y3": 86.10400000000004, "coord_origin": "TOPLEFT"}, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 35, "label": "text", "bbox": {"l": 331.037, "t": 78.63300000000004, "r": 352.126, "b": 84.279, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 24, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 331.037, "r_y0": 84.279, "r_x1": 352.126, "r_y1": 84.279, "r_x2": 352.126, "r_y2": 78.63300000000004, "r_x3": 331.037, "r_y3": 78.63300000000004, "coord_origin": "TOPLEFT"}, "text": "BBoxes", "orig": "BBoxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 36, "label": "text", "bbox": {"l": 390.564, "t": 96.106, "r": 431.726, "b": 101.75199999999995, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 25, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 390.564, "r_y0": 101.75199999999995, "r_x1": 431.726, "r_y1": 101.75199999999995, "r_x2": 431.726, "r_y2": 96.106, "r_x3": 390.564, "r_y3": 96.106, "coord_origin": "TOPLEFT"}, "text": "BBoxes can be", "orig": "BBoxes can be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 37, "label": "text", "bbox": {"l": 386.824, "t": 102.226, "r": 435.47, "b": 107.87199999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 26, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 386.824, "r_y0": 107.87199999999996, "r_x1": 435.47, "r_y1": 107.87199999999996, "r_x2": 435.47, "r_y2": 102.226, "r_x3": 386.824, "r_y3": 102.226, "coord_origin": "TOPLEFT"}, "text": "traced back to the", "orig": "traced back to the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 38, "label": "text", "bbox": {"l": 388.696, "t": 108.346, "r": 433.603, "b": 113.99199999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 27, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 388.696, "r_y0": 113.99199999999996, "r_x1": 433.603, "r_y1": 113.99199999999996, "r_x2": 433.603, "r_y2": 108.346, "r_x3": 388.696, "r_y3": 108.346, "coord_origin": "TOPLEFT"}, "text": "original image to", "orig": "original image to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 39, "label": "text", "bbox": {"l": 391.078, "t": 114.46600000000001, "r": 431.225, "b": 120.11199999999997, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 28, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 391.078, "r_y0": 120.11199999999997, "r_x1": 431.225, "r_y1": 120.11199999999997, "r_x2": 431.225, "r_y2": 114.46600000000001, "r_x3": 391.078, "r_y3": 114.46600000000001, "coord_origin": "TOPLEFT"}, "text": "extract content", "orig": "extract content", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 40, "label": "text", "bbox": {"l": 431.227, "t": 151.75900000000001, "r": 498.821, "b": 157.40499999999997, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 29, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 431.227, "r_y0": 157.40499999999997, "r_x1": 498.821, "r_y1": 157.40499999999997, "r_x2": 498.821, "r_y2": 151.75900000000001, "r_x3": 431.227, "r_y3": 151.75900000000001, "coord_origin": "TOPLEFT"}, "text": "Structure Tags sequence", "orig": "Structure Tags sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 41, "label": "text", "bbox": {"l": 431.174, "t": 157.87900000000002, "r": 498.878, "b": 163.52499999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 30, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 431.174, "r_y0": 163.52499999999998, "r_x1": 498.878, "r_y1": 163.52499999999998, "r_x2": 498.878, "r_y2": 157.87900000000002, "r_x3": 431.174, "r_y3": 157.87900000000002, "coord_origin": "TOPLEFT"}, "text": "provide full description of", "orig": "provide full description of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 42, "label": "text", "bbox": {"l": 440.529, "t": 163.99900000000002, "r": 489.518, "b": 169.64499999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 440.529, "r_y0": 169.64499999999998, "r_x1": 489.518, "r_y1": 169.64499999999998, "r_x2": 489.518, "r_y2": 163.99900000000002, "r_x3": 440.529, "r_y3": 163.99900000000002, "coord_origin": "TOPLEFT"}, "text": "the table structure", "orig": "the table structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 43, "label": "text", "bbox": {"l": 328.375, "t": 178.327, "r": 367.723, "b": 183.97299999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.375, "r_y0": 183.97299999999996, "r_x1": 367.723, "r_y1": 183.97299999999996, "r_x2": 367.723, "r_y2": 178.327, "r_x3": 328.375, "r_y3": 178.327, "coord_origin": "TOPLEFT"}, "text": "Structure Tags", "orig": "Structure Tags", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 44, "label": "text", "bbox": {"l": 331.845, "t": 123.98199999999997, "r": 373.68, "b": 129.62800000000004, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 331.845, "r_y0": 129.62800000000004, "r_x1": 373.68, "r_y1": 129.62800000000004, "r_x2": 373.68, "r_y2": 123.98199999999997, "r_x3": 331.845, "r_y3": 123.98199999999997, "coord_origin": "TOPLEFT"}, "text": "BBoxes in sync", "orig": "BBoxes in sync", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 45, "label": "text", "bbox": {"l": 331.845, "t": 129.082, "r": 381.178, "b": 134.72799999999995, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 331.845, "r_y0": 134.72799999999995, "r_x1": 381.178, "r_y1": 134.72799999999995, "r_x2": 381.178, "r_y2": 129.082, "r_x3": 331.845, "r_y3": 129.082, "coord_origin": "TOPLEFT"}, "text": "with tag sequence", "orig": "with tag sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 46, "label": "text", "bbox": {"l": 196.626, "t": 88.19000000000005, "r": 219.423, "b": 93.83600000000001, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 196.626, "r_y0": 93.83600000000001, "r_x1": 219.423, "r_y1": 93.83600000000001, "r_x2": 219.423, "r_y2": 88.19000000000005, "r_x3": 196.626, "r_y3": 88.19000000000005, "coord_origin": "TOPLEFT"}, "text": "Encoder", "orig": "Encoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 47, "label": "text", "bbox": {"l": 246.668, "t": 129.56799999999998, "r": 271.499, "b": 135.21400000000006, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 246.668, "r_y0": 135.21400000000006, "r_x1": 271.499, "r_y1": 135.21400000000006, "r_x2": 271.499, "r_y2": 129.56799999999998, "r_x3": 246.668, "r_y3": 129.56799999999998, "coord_origin": "TOPLEFT"}, "text": "Structure", "orig": "Structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 48, "label": "text", "bbox": {"l": 247.516, "t": 134.668, "r": 270.65, "b": 140.31399999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 247.516, "r_y0": 140.31399999999996, "r_x1": 270.65, "r_y1": 140.31399999999996, "r_x2": 270.65, "r_y2": 134.668, "r_x3": 247.516, "r_y3": 134.668, "coord_origin": "TOPLEFT"}, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 49, "label": "text", "bbox": {"l": 330.631, "t": 89.09299999999996, "r": 365.553, "b": 94.73900000000003, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 330.631, "r_y0": 94.73900000000003, "r_x1": 365.553, "r_y1": 94.73900000000003, "r_x2": 365.553, "r_y2": 89.09299999999996, "r_x3": 330.631, "r_y3": 89.09299999999996, "coord_origin": "TOPLEFT"}, "text": "[x1, y2, x2, y2]", "orig": "[x1, y2, x2, y2]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 50, "label": "text", "bbox": {"l": 330.631, "t": 97.25300000000004, "r": 370.227, "b": 102.899, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 330.631, "r_y0": 102.899, "r_x1": 370.227, "r_y1": 102.899, "r_x2": 370.227, "r_y2": 97.25300000000004, "r_x3": 330.631, "r_y3": 97.25300000000004, "coord_origin": "TOPLEFT"}, "text": "[x1', y2', x2', y2']", "orig": "[x1', y2', x2', y2']", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 51, "label": "text", "bbox": {"l": 330.631, "t": 105.41300000000001, "r": 374.512, "b": 111.05899999999997, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 330.631, "r_y0": 111.05899999999997, "r_x1": 374.512, "r_y1": 111.05899999999997, "r_x2": 374.512, "r_y2": 105.41300000000001, "r_x3": 330.631, "r_y3": 105.41300000000001, "coord_origin": "TOPLEFT"}, "text": "[x1'', y2'', x2'', y2'']", "orig": "[x1'', y2'', x2'', y2'']", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 52, "label": "text", "bbox": {"l": 330.631, "t": 113.57299999999998, "r": 335.732, "b": 119.21900000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 330.631, "r_y0": 119.21900000000005, "r_x1": 335.732, "r_y1": 119.21900000000005, "r_x2": 335.732, "r_y2": 113.57299999999998, "r_x3": 330.631, "r_y3": 113.57299999999998, "coord_origin": "TOPLEFT"}, "text": "...", "orig": "...", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 53, "label": "text", "bbox": {"l": 322.306, "t": 141.85400000000004, "r": 335.06, "b": 146.558, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 322.306, "r_y0": 146.558, "r_x1": 335.06, "r_y1": 146.558, "r_x2": 335.06, "r_y2": 141.85400000000004, "r_x3": 322.306, "r_y3": 141.85400000000004, "coord_origin": "TOPLEFT"}, "text": "<TR>", "orig": "<TR>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 54, "label": "text", "bbox": {"l": 322.306, "t": 148.99400000000003, "r": 421.588, "b": 153.69799999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 322.306, "r_y0": 153.69799999999998, "r_x1": 421.588, "r_y1": 153.69799999999998, "r_x2": 421.588, "r_y2": 148.99400000000003, "r_x3": 322.306, "r_y3": 148.99400000000003, "coord_origin": "TOPLEFT"}, "text": "<TD> 1 </TD><TD colspan=\"2\"> 2 </TD>", "orig": "<TD> 1 </TD><TD colspan=\"2\"> 2 </TD>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 55, "label": "text", "bbox": {"l": 322.306, "t": 156.13400000000001, "r": 349.23, "b": 160.83799999999997, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 322.306, "r_y0": 160.83799999999997, "r_x1": 349.23, "r_y1": 160.83799999999997, "r_x2": 349.23, "r_y2": 156.13400000000001, "r_x3": 322.306, "r_y3": 156.13400000000001, "coord_origin": "TOPLEFT"}, "text": "</TR><TR>", "orig": "</TR><TR>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 56, "label": "text", "bbox": {"l": 322.306, "t": 163.274, "r": 374.737, "b": 167.97799999999995, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 322.306, "r_y0": 167.97799999999995, "r_x1": 374.737, "r_y1": 167.97799999999995, "r_x2": 374.737, "r_y2": 163.274, "r_x3": 322.306, "r_y3": 163.274, "coord_origin": "TOPLEFT"}, "text": "<TD> 3 </TD><TD>...", "orig": "<TD> 3 </TD><TD>...", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 57, "label": "text", "bbox": {"l": 322.306, "t": 170.414, "r": 326.557, "b": 175.11800000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 322.306, "r_y0": 175.11800000000005, "r_x1": 326.557, "r_y1": 175.11800000000005, "r_x2": 326.557, "r_y2": 170.414, "r_x3": 322.306, "r_y3": 170.414, "coord_origin": "TOPLEFT"}, "text": "...", "orig": "...", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 58, "label": "text", "bbox": {"l": 323.511, "t": 89.74300000000005, "r": 326.914, "b": 95.38900000000001, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 323.511, "r_y0": 95.38900000000001, "r_x1": 326.914, "r_y1": 95.38900000000001, "r_x2": 326.914, "r_y2": 89.74300000000005, "r_x3": 323.511, "r_y3": 89.74300000000005, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 59, "label": "text", "bbox": {"l": 323.715, "t": 97.86199999999997, "r": 327.118, "b": 103.50800000000004, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 48, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 323.715, "r_y0": 103.50800000000004, "r_x1": 327.118, "r_y1": 103.50800000000004, "r_x2": 327.118, "r_y2": 97.86199999999997, "r_x3": 323.715, "r_y3": 97.86199999999997, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 60, "label": "text", "bbox": {"l": 323.715, "t": 106.06299999999999, "r": 327.118, "b": 111.70899999999995, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 49, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 323.715, "r_y0": 111.70899999999995, "r_x1": 327.118, "r_y1": 111.70899999999995, "r_x2": 327.118, "r_y2": 106.06299999999999, "r_x3": 323.715, "r_y3": 106.06299999999999, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 61, "label": "text", "bbox": {"l": 454.464, "t": 104.61900000000003, "r": 457.867, "b": 110.26499999999999, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 50, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 454.464, "r_y0": 110.26499999999999, "r_x1": 457.867, "r_y1": 110.26499999999999, "r_x2": 457.867, "r_y2": 104.61900000000003, "r_x3": 454.464, "r_y3": 104.61900000000003, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 62, "label": "text", "bbox": {"l": 493.326, "t": 91.16899999999998, "r": 496.729, "b": 96.81500000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 51, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 493.326, "r_y0": 96.81500000000005, "r_x1": 496.729, "r_y1": 96.81500000000005, "r_x2": 496.729, "r_y2": 91.16899999999998, "r_x3": 493.326, "r_y3": 91.16899999999998, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 63, "label": "text", "bbox": {"l": 454.083, "t": 90.64200000000005, "r": 457.486, "b": 96.28800000000001, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 52, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 454.083, "r_y0": 96.28800000000001, "r_x1": 457.486, "r_y1": 96.28800000000001, "r_x2": 457.486, "r_y2": 90.64200000000005, "r_x3": 454.083, "r_y3": 90.64200000000005, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}]}, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null}, {"label": "caption", "id": 6, "page_no": 4, "cluster": {"id": 6, "label": "caption", "bbox": {"l": 50.112, "t": 203.986, "r": 545.108, "b": 224.88099999999997, "coord_origin": "TOPLEFT"}, "confidence": 0.9677652716636658, "cells": [{"index": 53, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 212.92600000000004, "r_x1": 86.884, "r_y1": 212.92600000000004, "r_x2": 86.884, "r_y2": 204.37400000000002, "r_x3": 50.112, "r_y3": 204.37400000000002, "coord_origin": "TOPLEFT"}, "text": "Figure 3:", "orig": "Figure 3:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 54, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 94.021, "r_y0": 212.942, "r_x1": 149.851, "r_y1": 212.942, "r_x2": 149.851, "r_y2": 203.986, "r_x3": 94.021, "r_y3": 203.986, "coord_origin": "TOPLEFT"}, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 55, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 152.861, "r_y0": 212.92600000000004, "r_x1": 545.108, "r_y1": 212.92600000000004, "r_x2": 545.108, "r_y2": 204.37400000000002, "r_x3": 152.861, "r_y3": 204.37400000000002, "coord_origin": "TOPLEFT"}, "text": "takes in an image of the PDF and creates bounding box and HTML structure predictions that are", "orig": "takes in an image of the PDF and creates bounding box and HTML structure predictions that are", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 56, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 224.88099999999997, "r_x1": 436.013, "r_y1": 224.88099999999997, "r_x2": 436.013, "r_y2": 216.32899999999995, "r_x3": 50.112, "r_y3": 216.32899999999995, "coord_origin": "TOPLEFT"}, "text": "synchronized. The bounding boxes grabs the content from the PDF and inserts it in the structure.", "orig": "synchronized. The bounding boxes grabs the content from the PDF and inserts it in the structure.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Figure 3: TableFormer takes in an image of the PDF and creates bounding box and HTML structure predictions that are synchronized. The bounding boxes grabs the content from the PDF and inserts it in the structure."}, {"label": "picture", "id": 5, "page_no": 4, "cluster": {"id": 5, "label": "picture", "bbox": {"l": 53.03328323364258, "t": 257.66534423828125, "r": 285.3731689453125, "b": 507.6688537597656, "coord_origin": "TOPLEFT"}, "confidence": 0.9724942445755005, "cells": [{"index": 57, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 74.253, "r_y0": 263.884, "r_x1": 101.758, "r_y1": 263.884, "r_x2": 101.758, "r_y2": 259.52, "r_x3": 74.253, "r_y3": 259.52, "coord_origin": "TOPLEFT"}, "text": "Input Image", "orig": "Input Image", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 58, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 122.3, "r_y0": 264.015, "r_x1": 157.84, "r_y1": 264.015, "r_x2": 157.84, "r_y2": 259.65, "r_x3": 122.3, "r_y3": 259.65, "coord_origin": "TOPLEFT"}, "text": "Tokenised Tags", "orig": "Tokenised Tags", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 59, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 78.549, "r_y0": 376.78, "r_x1": 125.684, "r_y1": 376.78, "r_x2": 125.684, "r_y2": 372.588, "r_x3": 78.549, "r_y3": 372.588, "coord_origin": "TOPLEFT"}, "text": "Multi-Head Attention", "orig": "Multi-Head Attention", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 60, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 78.513, "r_y0": 396.713, "r_x1": 125.111, "r_y1": 396.713, "r_x2": 125.111, "r_y2": 392.52, "r_x3": 78.513, "r_y3": 392.52, "coord_origin": "TOPLEFT"}, "text": "Add & Normalisation", "orig": "Add & Normalisation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 61, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 76.025, "r_y0": 429.848, "r_x1": 127.923, "r_y1": 429.848, "r_x2": 127.923, "r_y2": 425.655, "r_x3": 76.025, "r_y3": 425.655, "coord_origin": "TOPLEFT"}, "text": "Feed Forward Network", "orig": "Feed Forward Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 62, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 78.383, "r_y0": 450.284, "r_x1": 124.98, "r_y1": 450.284, "r_x2": 124.98, "r_y2": 446.091, "r_x3": 78.383, "r_y3": 446.091, "coord_origin": "TOPLEFT"}, "text": "Add & Normalisation", "orig": "Add & Normalisation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 63, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 167.469, "r_y0": 467.838, "r_x1": 181.629, "r_y1": 467.838, "r_x2": 181.629, "r_y2": 463.645, "r_x3": 167.469, "r_y3": 463.645, "coord_origin": "TOPLEFT"}, "text": "Linear", "orig": "Linear", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 64, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 165.613, "r_y0": 483.866, "r_x1": 184.432, "r_y1": 483.866, "r_x2": 184.432, "r_y2": 479.673, "r_x3": 165.613, "r_y3": 479.673, "coord_origin": "TOPLEFT"}, "text": "Softmax", "orig": "Softmax", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 65, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 65.32, "r_y0": 329.941, "r_x1": 132.925, "r_y1": 329.941, "r_x2": 132.925, "r_y2": 325.527, "r_x3": 65.32, "r_y3": 325.527, "coord_origin": "TOPLEFT"}, "text": "CNN BACKBONE ENCODER", "orig": "CNN BACKBONE ENCODER", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 66, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 119.515, "r_y0": 274.491, "r_x1": 126.837, "r_y1": 274.491, "r_x2": 126.837, "r_y2": 270.73900000000003, "r_x3": 119.515, "r_y3": 270.73900000000003, "coord_origin": "TOPLEFT"}, "text": "[30,", "orig": "[30,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 67, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 129.2, "r_y0": 274.491, "r_x1": 132.745, "r_y1": 274.491, "r_x2": 132.745, "r_y2": 270.73900000000003, "r_x3": 129.2, "r_y3": 270.73900000000003, "coord_origin": "TOPLEFT"}, "text": "1,", "orig": "1,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 68, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 135.108, "r_y0": 274.491, "r_x1": 138.652, "r_y1": 274.491, "r_x2": 138.652, "r_y2": 270.73900000000003, "r_x3": 135.108, "r_y3": 270.73900000000003, "coord_origin": "TOPLEFT"}, "text": "2,", "orig": "2,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 69, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 141.015, "r_y0": 274.491, "r_x1": 144.56, "r_y1": 274.491, "r_x2": 144.56, "r_y2": 270.73900000000003, "r_x3": 141.015, "r_y3": 270.73900000000003, "coord_origin": "TOPLEFT"}, "text": "3,", "orig": "3,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 70, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 146.923, "r_y0": 274.491, "r_x1": 160.625, "r_y1": 274.491, "r_x2": 160.625, "r_y2": 270.73900000000003, "r_x3": 146.923, "r_y3": 270.73900000000003, "coord_origin": "TOPLEFT"}, "text": "4, \u20263,", "orig": "4, \u20263,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 71, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 128.729, "r_y0": 279.741, "r_x1": 132.273, "r_y1": 279.741, "r_x2": 132.273, "r_y2": 275.98900000000003, "r_x3": 128.729, "r_y3": 275.98900000000003, "coord_origin": "TOPLEFT"}, "text": "4,", "orig": "4,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 72, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.636, "r_y0": 279.741, "r_x1": 138.181, "r_y1": 279.741, "r_x2": 138.181, "r_y2": 275.98900000000003, "r_x3": 134.636, "r_y3": 275.98900000000003, "coord_origin": "TOPLEFT"}, "text": "5,", "orig": "5,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 73, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 140.544, "r_y0": 279.741, "r_x1": 151.411, "r_y1": 279.741, "r_x2": 151.411, "r_y2": 275.98900000000003, "r_x3": 140.544, "r_y3": 275.98900000000003, "coord_origin": "TOPLEFT"}, "text": "8, 31]", "orig": "8, 31]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 74, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 60.434, "r_y0": 343.926, "r_x1": 79.019, "r_y1": 343.926, "r_x2": 79.019, "r_y2": 340.521, "r_x3": 60.434, "r_y3": 340.521, "coord_origin": "TOPLEFT"}, "text": "Positional", "orig": "Positional", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 75, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 60.598, "r_y0": 348.352, "r_x1": 78.855, "r_y1": 348.352, "r_x2": 78.855, "r_y2": 344.948, "r_x3": 60.598, "r_y3": 344.948, "coord_origin": "TOPLEFT"}, "text": "Encoding", "orig": "Encoding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 76, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.829, "r_y0": 298.344, "r_x1": 153.414, "r_y1": 298.344, "r_x2": 153.414, "r_y2": 294.939, "r_x3": 134.829, "r_y3": 294.939, "coord_origin": "TOPLEFT"}, "text": "Positional", "orig": "Positional", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 77, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.993, "r_y0": 302.77, "r_x1": 153.25, "r_y1": 302.77, "r_x2": 153.25, "r_y2": 299.365, "r_x3": 134.993, "r_y3": 299.365, "coord_origin": "TOPLEFT"}, "text": "Encoding", "orig": "Encoding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 78, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 150.552, "r_y0": 350.753, "r_x1": 197.149, "r_y1": 350.753, "r_x2": 197.149, "r_y2": 346.56, "r_x3": 150.552, "r_y3": 346.56, "coord_origin": "TOPLEFT"}, "text": "Add & Normalisation", "orig": "Add & Normalisation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 79, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 150.552, "r_y0": 399.818, "r_x1": 197.149, "r_y1": 399.818, "r_x2": 197.149, "r_y2": 395.625, "r_x3": 150.552, "r_y3": 395.625, "coord_origin": "TOPLEFT"}, "text": "Add & Normalisation", "orig": "Add & Normalisation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 80, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 150.185, "r_y0": 381.063, "r_x1": 197.32, "r_y1": 381.063, "r_x2": 197.32, "r_y2": 376.87, "r_x3": 150.185, "r_y3": 376.87, "coord_origin": "TOPLEFT"}, "text": "Multi-Head Attention", "orig": "Multi-Head Attention", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 81, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 150.552, "r_y0": 445.643, "r_x1": 197.149, "r_y1": 445.643, "r_x2": 197.149, "r_y2": 441.45, "r_x3": 150.552, "r_y3": 441.45, "coord_origin": "TOPLEFT"}, "text": "Add & Normalisation", "orig": "Add & Normalisation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 82, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 147.864, "r_y0": 427.488, "r_x1": 199.762, "r_y1": 427.488, "r_x2": 199.762, "r_y2": 423.295, "r_x3": 147.864, "r_y3": 423.295, "coord_origin": "TOPLEFT"}, "text": "Feed Forward Network", "orig": "Feed Forward Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 83, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 241.566, "r_y0": 319.657, "r_x1": 255.725, "r_y1": 319.657, "r_x2": 255.725, "r_y2": 315.465, "r_x3": 241.566, "r_y3": 315.465, "coord_origin": "TOPLEFT"}, "text": "Linear", "orig": "Linear", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 84, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 241.917, "r_y0": 366.759, "r_x1": 256.077, "r_y1": 366.759, "r_x2": 256.077, "r_y2": 362.567, "r_x3": 241.917, "r_y3": 362.567, "coord_origin": "TOPLEFT"}, "text": "Linear", "orig": "Linear", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 85, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 228.054, "r_y0": 342.014, "r_x1": 269.393, "r_y1": 342.014, "r_x2": 269.393, "r_y2": 337.821, "r_x3": 228.054, "r_y3": 337.821, "coord_origin": "TOPLEFT"}, "text": "Attention Network", "orig": "Attention Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 86, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 228.446, "r_y0": 410.541, "r_x1": 238.739, "r_y1": 410.541, "r_x2": 238.739, "r_y2": 406.349, "r_x3": 228.446, "r_y3": 406.349, "coord_origin": "TOPLEFT"}, "text": "MLP", "orig": "MLP", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 87, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 256.298, "r_y0": 410.598, "r_x1": 270.457, "r_y1": 410.598, "r_x2": 270.457, "r_y2": 406.405, "r_x3": 256.298, "r_y3": 406.405, "coord_origin": "TOPLEFT"}, "text": "Linear", "orig": "Linear", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 88, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 239.545, "r_y0": 387.608, "r_x1": 258.089, "r_y1": 387.608, "r_x2": 258.089, "r_y2": 383.415, "r_x3": 239.545, "r_y3": 383.415, "coord_origin": "TOPLEFT"}, "text": "Sigmoid", "orig": "Sigmoid", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 89, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 59.258, "r_y0": 449.783, "r_x1": 59.245, "r_y1": 384.871, "r_x2": 55.273, "r_y2": 384.872, "r_x3": 55.286, "r_y3": 449.784, "coord_origin": "TOPLEFT"}, "text": "Transformer Encoder Network", "orig": "Transformer Encoder Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 90, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 59.058, "r_y0": 378.454, "r_x1": 59.055, "r_y1": 373.809, "r_x2": 55.345, "r_y2": 373.812, "r_x3": 55.348, "r_y3": 378.457, "coord_origin": "TOPLEFT"}, "text": "x2", "orig": "x2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 91, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 85.296, "r_y0": 490.108, "r_x1": 122.166, "r_y1": 490.098, "r_x2": 122.165, "r_y2": 485.687, "r_x3": 85.295, "r_y3": 485.697, "coord_origin": "TOPLEFT"}, "text": "Encoded Output", "orig": "Encoded Output", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 92, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 229.666, "r_y0": 285.074, "r_x1": 265.321, "r_y1": 285.064, "r_x2": 265.32, "r_y2": 281.281, "r_x3": 229.665, "r_y3": 281.291, "coord_origin": "TOPLEFT"}, "text": "Encoded Output", "orig": "Encoded Output", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 93, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 157.174, "r_y0": 505.871, "r_x1": 190.419, "r_y1": 505.862, "r_x2": 190.417, "r_y2": 501.45, "r_x3": 157.172, "r_y3": 501.459, "coord_origin": "TOPLEFT"}, "text": "Predicted Tags", "orig": "Predicted Tags", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 94, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 227.816, "r_y0": 443.634, "r_x1": 269.396, "r_y1": 443.622, "r_x2": 269.395, "r_y2": 439.211, "r_x3": 227.815, "r_y3": 439.222, "coord_origin": "TOPLEFT"}, "text": "Bounding Boxes &", "orig": "Bounding Boxes &", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 95, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 233.703, "r_y0": 449.632, "r_x1": 263.513, "r_y1": 449.624, "r_x2": 263.511, "r_y2": 445.212, "r_x3": 233.701, "r_y3": 445.22, "coord_origin": "TOPLEFT"}, "text": "Classification", "orig": "Classification", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 96, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 184.747, "r_y0": 298.506, "r_x1": 210.91, "r_y1": 298.506, "r_x2": 210.91, "r_y2": 294.534, "r_x3": 184.747, "r_y3": 294.534, "coord_origin": "TOPLEFT"}, "text": "Transformer", "orig": "Transformer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 97, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 178.912, "r_y0": 304.256, "r_x1": 216.744, "r_y1": 304.256, "r_x2": 216.744, "r_y2": 300.284, "r_x3": 178.912, "r_y3": 300.284, "coord_origin": "TOPLEFT"}, "text": "Decoder Network", "orig": "Decoder Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 98, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 194.246, "r_y0": 287.601, "r_x1": 198.891, "r_y1": 287.601, "r_x2": 198.891, "r_y2": 283.891, "r_x3": 194.246, "r_y3": 283.891, "coord_origin": "TOPLEFT"}, "text": "x4", "orig": "x4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 99, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 221.456, "r_y0": 277.548, "r_x1": 276.471, "r_y1": 277.548, "r_x2": 276.471, "r_y2": 273.134, "r_x3": 221.456, "r_y3": 273.134, "coord_origin": "TOPLEFT"}, "text": "CELL BBOX DECODER", "orig": "CELL BBOX DECODER", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 100, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.652, "r_y0": 328.837, "r_x1": 195.97, "r_y1": 328.837, "r_x2": 195.97, "r_y2": 324.644, "r_x3": 151.652, "r_y3": 324.644, "coord_origin": "TOPLEFT"}, "text": "Masked Multi-Head", "orig": "Masked Multi-Head", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 101, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 163.433, "r_y0": 334.837, "r_x1": 184.19, "r_y1": 334.837, "r_x2": 184.19, "r_y2": 330.644, "r_x3": 163.433, "r_y3": 330.644, "coord_origin": "TOPLEFT"}, "text": "Attention", "orig": "Attention", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": [{"id": 64, "label": "text", "bbox": {"l": 74.253, "t": 259.52, "r": 101.758, "b": 263.884, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 57, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 74.253, "r_y0": 263.884, "r_x1": 101.758, "r_y1": 263.884, "r_x2": 101.758, "r_y2": 259.52, "r_x3": 74.253, "r_y3": 259.52, "coord_origin": "TOPLEFT"}, "text": "Input Image", "orig": "Input Image", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 65, "label": "text", "bbox": {"l": 122.3, "t": 259.65, "r": 157.84, "b": 264.015, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 58, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 122.3, "r_y0": 264.015, "r_x1": 157.84, "r_y1": 264.015, "r_x2": 157.84, "r_y2": 259.65, "r_x3": 122.3, "r_y3": 259.65, "coord_origin": "TOPLEFT"}, "text": "Tokenised Tags", "orig": "Tokenised Tags", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 66, "label": "text", "bbox": {"l": 78.549, "t": 372.588, "r": 125.684, "b": 376.78, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 59, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 78.549, "r_y0": 376.78, "r_x1": 125.684, "r_y1": 376.78, "r_x2": 125.684, "r_y2": 372.588, "r_x3": 78.549, "r_y3": 372.588, "coord_origin": "TOPLEFT"}, "text": "Multi-Head Attention", "orig": "Multi-Head Attention", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 67, "label": "text", "bbox": {"l": 78.513, "t": 392.52, "r": 125.111, "b": 396.713, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 60, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 78.513, "r_y0": 396.713, "r_x1": 125.111, "r_y1": 396.713, "r_x2": 125.111, "r_y2": 392.52, "r_x3": 78.513, "r_y3": 392.52, "coord_origin": "TOPLEFT"}, "text": "Add & Normalisation", "orig": "Add & Normalisation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 68, "label": "text", "bbox": {"l": 76.025, "t": 425.655, "r": 127.923, "b": 429.848, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 61, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 76.025, "r_y0": 429.848, "r_x1": 127.923, "r_y1": 429.848, "r_x2": 127.923, "r_y2": 425.655, "r_x3": 76.025, "r_y3": 425.655, "coord_origin": "TOPLEFT"}, "text": "Feed Forward Network", "orig": "Feed Forward Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 69, "label": "text", "bbox": {"l": 78.383, "t": 446.091, "r": 124.98, "b": 450.284, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 62, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 78.383, "r_y0": 450.284, "r_x1": 124.98, "r_y1": 450.284, "r_x2": 124.98, "r_y2": 446.091, "r_x3": 78.383, "r_y3": 446.091, "coord_origin": "TOPLEFT"}, "text": "Add & Normalisation", "orig": "Add & Normalisation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 70, "label": "text", "bbox": {"l": 167.469, "t": 463.645, "r": 181.629, "b": 467.838, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 63, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 167.469, "r_y0": 467.838, "r_x1": 181.629, "r_y1": 467.838, "r_x2": 181.629, "r_y2": 463.645, "r_x3": 167.469, "r_y3": 463.645, "coord_origin": "TOPLEFT"}, "text": "Linear", "orig": "Linear", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 71, "label": "text", "bbox": {"l": 165.613, "t": 479.673, "r": 184.432, "b": 483.866, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 64, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 165.613, "r_y0": 483.866, "r_x1": 184.432, "r_y1": 483.866, "r_x2": 184.432, "r_y2": 479.673, "r_x3": 165.613, "r_y3": 479.673, "coord_origin": "TOPLEFT"}, "text": "Softmax", "orig": "Softmax", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 72, "label": "text", "bbox": {"l": 65.32, "t": 325.527, "r": 132.925, "b": 329.941, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 65, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 65.32, "r_y0": 329.941, "r_x1": 132.925, "r_y1": 329.941, "r_x2": 132.925, "r_y2": 325.527, "r_x3": 65.32, "r_y3": 325.527, "coord_origin": "TOPLEFT"}, "text": "CNN BACKBONE ENCODER", "orig": "CNN BACKBONE ENCODER", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 73, "label": "text", "bbox": {"l": 119.515, "t": 270.73900000000003, "r": 126.837, "b": 274.491, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 66, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 119.515, "r_y0": 274.491, "r_x1": 126.837, "r_y1": 274.491, "r_x2": 126.837, "r_y2": 270.73900000000003, "r_x3": 119.515, "r_y3": 270.73900000000003, "coord_origin": "TOPLEFT"}, "text": "[30,", "orig": "[30,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 74, "label": "text", "bbox": {"l": 129.2, "t": 270.73900000000003, "r": 132.745, "b": 274.491, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 67, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 129.2, "r_y0": 274.491, "r_x1": 132.745, "r_y1": 274.491, "r_x2": 132.745, "r_y2": 270.73900000000003, "r_x3": 129.2, "r_y3": 270.73900000000003, "coord_origin": "TOPLEFT"}, "text": "1,", "orig": "1,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 75, "label": "text", "bbox": {"l": 135.108, "t": 270.73900000000003, "r": 138.652, "b": 274.491, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 68, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 135.108, "r_y0": 274.491, "r_x1": 138.652, "r_y1": 274.491, "r_x2": 138.652, "r_y2": 270.73900000000003, "r_x3": 135.108, "r_y3": 270.73900000000003, "coord_origin": "TOPLEFT"}, "text": "2,", "orig": "2,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 76, "label": "text", "bbox": {"l": 141.015, "t": 270.73900000000003, "r": 144.56, "b": 274.491, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 69, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 141.015, "r_y0": 274.491, "r_x1": 144.56, "r_y1": 274.491, "r_x2": 144.56, "r_y2": 270.73900000000003, "r_x3": 141.015, "r_y3": 270.73900000000003, "coord_origin": "TOPLEFT"}, "text": "3,", "orig": "3,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 77, "label": "text", "bbox": {"l": 146.923, "t": 270.73900000000003, "r": 160.625, "b": 274.491, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 70, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 146.923, "r_y0": 274.491, "r_x1": 160.625, "r_y1": 274.491, "r_x2": 160.625, "r_y2": 270.73900000000003, "r_x3": 146.923, "r_y3": 270.73900000000003, "coord_origin": "TOPLEFT"}, "text": "4, \u20263,", "orig": "4, \u20263,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 78, "label": "text", "bbox": {"l": 128.729, "t": 275.98900000000003, "r": 132.273, "b": 279.741, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 71, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 128.729, "r_y0": 279.741, "r_x1": 132.273, "r_y1": 279.741, "r_x2": 132.273, "r_y2": 275.98900000000003, "r_x3": 128.729, "r_y3": 275.98900000000003, "coord_origin": "TOPLEFT"}, "text": "4,", "orig": "4,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 79, "label": "text", "bbox": {"l": 134.636, "t": 275.98900000000003, "r": 138.181, "b": 279.741, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 72, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.636, "r_y0": 279.741, "r_x1": 138.181, "r_y1": 279.741, "r_x2": 138.181, "r_y2": 275.98900000000003, "r_x3": 134.636, "r_y3": 275.98900000000003, "coord_origin": "TOPLEFT"}, "text": "5,", "orig": "5,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 80, "label": "text", "bbox": {"l": 140.544, "t": 275.98900000000003, "r": 151.411, "b": 279.741, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 73, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 140.544, "r_y0": 279.741, "r_x1": 151.411, "r_y1": 279.741, "r_x2": 151.411, "r_y2": 275.98900000000003, "r_x3": 140.544, "r_y3": 275.98900000000003, "coord_origin": "TOPLEFT"}, "text": "8, 31]", "orig": "8, 31]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 81, "label": "text", "bbox": {"l": 60.434, "t": 340.521, "r": 79.019, "b": 343.926, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 74, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 60.434, "r_y0": 343.926, "r_x1": 79.019, "r_y1": 343.926, "r_x2": 79.019, "r_y2": 340.521, "r_x3": 60.434, "r_y3": 340.521, "coord_origin": "TOPLEFT"}, "text": "Positional", "orig": "Positional", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 82, "label": "text", "bbox": {"l": 60.598, "t": 344.948, "r": 78.855, "b": 348.352, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 75, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 60.598, "r_y0": 348.352, "r_x1": 78.855, "r_y1": 348.352, "r_x2": 78.855, "r_y2": 344.948, "r_x3": 60.598, "r_y3": 344.948, "coord_origin": "TOPLEFT"}, "text": "Encoding", "orig": "Encoding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 83, "label": "text", "bbox": {"l": 134.829, "t": 294.939, "r": 153.414, "b": 298.344, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 76, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.829, "r_y0": 298.344, "r_x1": 153.414, "r_y1": 298.344, "r_x2": 153.414, "r_y2": 294.939, "r_x3": 134.829, "r_y3": 294.939, "coord_origin": "TOPLEFT"}, "text": "Positional", "orig": "Positional", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 84, "label": "text", "bbox": {"l": 134.993, "t": 299.365, "r": 153.25, "b": 302.77, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 77, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.993, "r_y0": 302.77, "r_x1": 153.25, "r_y1": 302.77, "r_x2": 153.25, "r_y2": 299.365, "r_x3": 134.993, "r_y3": 299.365, "coord_origin": "TOPLEFT"}, "text": "Encoding", "orig": "Encoding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 85, "label": "text", "bbox": {"l": 150.552, "t": 346.56, "r": 197.149, "b": 350.753, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 78, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 150.552, "r_y0": 350.753, "r_x1": 197.149, "r_y1": 350.753, "r_x2": 197.149, "r_y2": 346.56, "r_x3": 150.552, "r_y3": 346.56, "coord_origin": "TOPLEFT"}, "text": "Add & Normalisation", "orig": "Add & Normalisation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 86, "label": "text", "bbox": {"l": 150.552, "t": 395.625, "r": 197.149, "b": 399.818, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 79, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 150.552, "r_y0": 399.818, "r_x1": 197.149, "r_y1": 399.818, "r_x2": 197.149, "r_y2": 395.625, "r_x3": 150.552, "r_y3": 395.625, "coord_origin": "TOPLEFT"}, "text": "Add & Normalisation", "orig": "Add & Normalisation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 87, "label": "text", "bbox": {"l": 150.185, "t": 376.87, "r": 197.32, "b": 381.063, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 80, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 150.185, "r_y0": 381.063, "r_x1": 197.32, "r_y1": 381.063, "r_x2": 197.32, "r_y2": 376.87, "r_x3": 150.185, "r_y3": 376.87, "coord_origin": "TOPLEFT"}, "text": "Multi-Head Attention", "orig": "Multi-Head Attention", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 88, "label": "text", "bbox": {"l": 150.552, "t": 441.45, "r": 197.149, "b": 445.643, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 81, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 150.552, "r_y0": 445.643, "r_x1": 197.149, "r_y1": 445.643, "r_x2": 197.149, "r_y2": 441.45, "r_x3": 150.552, "r_y3": 441.45, "coord_origin": "TOPLEFT"}, "text": "Add & Normalisation", "orig": "Add & Normalisation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 89, "label": "text", "bbox": {"l": 147.864, "t": 423.295, "r": 199.762, "b": 427.488, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 82, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 147.864, "r_y0": 427.488, "r_x1": 199.762, "r_y1": 427.488, "r_x2": 199.762, "r_y2": 423.295, "r_x3": 147.864, "r_y3": 423.295, "coord_origin": "TOPLEFT"}, "text": "Feed Forward Network", "orig": "Feed Forward Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 90, "label": "text", "bbox": {"l": 241.566, "t": 315.465, "r": 255.725, "b": 319.657, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 83, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 241.566, "r_y0": 319.657, "r_x1": 255.725, "r_y1": 319.657, "r_x2": 255.725, "r_y2": 315.465, "r_x3": 241.566, "r_y3": 315.465, "coord_origin": "TOPLEFT"}, "text": "Linear", "orig": "Linear", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 91, "label": "text", "bbox": {"l": 241.917, "t": 362.567, "r": 256.077, "b": 366.759, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 84, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 241.917, "r_y0": 366.759, "r_x1": 256.077, "r_y1": 366.759, "r_x2": 256.077, "r_y2": 362.567, "r_x3": 241.917, "r_y3": 362.567, "coord_origin": "TOPLEFT"}, "text": "Linear", "orig": "Linear", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 92, "label": "text", "bbox": {"l": 228.054, "t": 337.821, "r": 269.393, "b": 342.014, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 85, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 228.054, "r_y0": 342.014, "r_x1": 269.393, "r_y1": 342.014, "r_x2": 269.393, "r_y2": 337.821, "r_x3": 228.054, "r_y3": 337.821, "coord_origin": "TOPLEFT"}, "text": "Attention Network", "orig": "Attention Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 93, "label": "text", "bbox": {"l": 228.446, "t": 406.349, "r": 238.739, "b": 410.541, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 86, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 228.446, "r_y0": 410.541, "r_x1": 238.739, "r_y1": 410.541, "r_x2": 238.739, "r_y2": 406.349, "r_x3": 228.446, "r_y3": 406.349, "coord_origin": "TOPLEFT"}, "text": "MLP", "orig": "MLP", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 94, "label": "text", "bbox": {"l": 256.298, "t": 406.405, "r": 270.457, "b": 410.598, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 87, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 256.298, "r_y0": 410.598, "r_x1": 270.457, "r_y1": 410.598, "r_x2": 270.457, "r_y2": 406.405, "r_x3": 256.298, "r_y3": 406.405, "coord_origin": "TOPLEFT"}, "text": "Linear", "orig": "Linear", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 95, "label": "text", "bbox": {"l": 239.545, "t": 383.415, "r": 258.089, "b": 387.608, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 88, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 239.545, "r_y0": 387.608, "r_x1": 258.089, "r_y1": 387.608, "r_x2": 258.089, "r_y2": 383.415, "r_x3": 239.545, "r_y3": 383.415, "coord_origin": "TOPLEFT"}, "text": "Sigmoid", "orig": "Sigmoid", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 96, "label": "text", "bbox": {"l": 55.273, "t": 384.871, "r": 59.258, "b": 449.784, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 89, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 59.258, "r_y0": 449.783, "r_x1": 59.245, "r_y1": 384.871, "r_x2": 55.273, "r_y2": 384.872, "r_x3": 55.286, "r_y3": 449.784, "coord_origin": "TOPLEFT"}, "text": "Transformer Encoder Network", "orig": "Transformer Encoder Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 97, "label": "text", "bbox": {"l": 55.345, "t": 373.809, "r": 59.058, "b": 378.457, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 90, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 59.058, "r_y0": 378.454, "r_x1": 59.055, "r_y1": 373.809, "r_x2": 55.345, "r_y2": 373.812, "r_x3": 55.348, "r_y3": 378.457, "coord_origin": "TOPLEFT"}, "text": "x2", "orig": "x2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 98, "label": "text", "bbox": {"l": 85.295, "t": 485.687, "r": 122.166, "b": 490.108, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 91, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 85.296, "r_y0": 490.108, "r_x1": 122.166, "r_y1": 490.098, "r_x2": 122.165, "r_y2": 485.687, "r_x3": 85.295, "r_y3": 485.697, "coord_origin": "TOPLEFT"}, "text": "Encoded Output", "orig": "Encoded Output", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 99, "label": "text", "bbox": {"l": 229.665, "t": 281.281, "r": 265.321, "b": 285.074, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 92, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 229.666, "r_y0": 285.074, "r_x1": 265.321, "r_y1": 285.064, "r_x2": 265.32, "r_y2": 281.281, "r_x3": 229.665, "r_y3": 281.291, "coord_origin": "TOPLEFT"}, "text": "Encoded Output", "orig": "Encoded Output", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 100, "label": "text", "bbox": {"l": 157.172, "t": 501.45, "r": 190.419, "b": 505.871, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 93, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 157.174, "r_y0": 505.871, "r_x1": 190.419, "r_y1": 505.862, "r_x2": 190.417, "r_y2": 501.45, "r_x3": 157.172, "r_y3": 501.459, "coord_origin": "TOPLEFT"}, "text": "Predicted Tags", "orig": "Predicted Tags", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 101, "label": "text", "bbox": {"l": 227.815, "t": 439.211, "r": 269.396, "b": 443.634, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 94, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 227.816, "r_y0": 443.634, "r_x1": 269.396, "r_y1": 443.622, "r_x2": 269.395, "r_y2": 439.211, "r_x3": 227.815, "r_y3": 439.222, "coord_origin": "TOPLEFT"}, "text": "Bounding Boxes &", "orig": "Bounding Boxes &", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 102, "label": "text", "bbox": {"l": 233.701, "t": 445.212, "r": 263.513, "b": 449.632, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 95, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 233.703, "r_y0": 449.632, "r_x1": 263.513, "r_y1": 449.624, "r_x2": 263.511, "r_y2": 445.212, "r_x3": 233.701, "r_y3": 445.22, "coord_origin": "TOPLEFT"}, "text": "Classification", "orig": "Classification", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 103, "label": "text", "bbox": {"l": 184.747, "t": 294.534, "r": 210.91, "b": 298.506, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 96, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 184.747, "r_y0": 298.506, "r_x1": 210.91, "r_y1": 298.506, "r_x2": 210.91, "r_y2": 294.534, "r_x3": 184.747, "r_y3": 294.534, "coord_origin": "TOPLEFT"}, "text": "Transformer", "orig": "Transformer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 104, "label": "text", "bbox": {"l": 178.912, "t": 300.284, "r": 216.744, "b": 304.256, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 97, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 178.912, "r_y0": 304.256, "r_x1": 216.744, "r_y1": 304.256, "r_x2": 216.744, "r_y2": 300.284, "r_x3": 178.912, "r_y3": 300.284, "coord_origin": "TOPLEFT"}, "text": "Decoder Network", "orig": "Decoder Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 105, "label": "text", "bbox": {"l": 194.246, "t": 283.891, "r": 198.891, "b": 287.601, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 98, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 194.246, "r_y0": 287.601, "r_x1": 198.891, "r_y1": 287.601, "r_x2": 198.891, "r_y2": 283.891, "r_x3": 194.246, "r_y3": 283.891, "coord_origin": "TOPLEFT"}, "text": "x4", "orig": "x4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 106, "label": "text", "bbox": {"l": 221.456, "t": 273.134, "r": 276.471, "b": 277.548, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 99, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 221.456, "r_y0": 277.548, "r_x1": 276.471, "r_y1": 277.548, "r_x2": 276.471, "r_y2": 273.134, "r_x3": 221.456, "r_y3": 273.134, "coord_origin": "TOPLEFT"}, "text": "CELL BBOX DECODER", "orig": "CELL BBOX DECODER", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 107, "label": "text", "bbox": {"l": 151.652, "t": 324.644, "r": 195.97, "b": 328.837, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 100, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.652, "r_y0": 328.837, "r_x1": 195.97, "r_y1": 328.837, "r_x2": 195.97, "r_y2": 324.644, "r_x3": 151.652, "r_y3": 324.644, "coord_origin": "TOPLEFT"}, "text": "Masked Multi-Head", "orig": "Masked Multi-Head", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 108, "label": "text", "bbox": {"l": 163.433, "t": 330.644, "r": 184.19, "b": 334.837, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 101, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 163.433, "r_y0": 334.837, "r_x1": 184.19, "r_y1": 334.837, "r_x2": 184.19, "r_y2": 330.644, "r_x3": 163.433, "r_y3": 330.644, "coord_origin": "TOPLEFT"}, "text": "Attention", "orig": "Attention", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}]}, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null}, {"label": "caption", "id": 8, "page_no": 4, "cluster": {"id": 8, "label": "caption", "bbox": {"l": 50.112, "t": 527.783, "r": 286.366, "b": 680.185, "coord_origin": "TOPLEFT"}, "confidence": 0.8913407325744629, "cells": [{"index": 102, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 536.723, "r_x1": 85.878, "r_y1": 536.723, "r_x2": 85.878, "r_y2": 528.171, "r_x3": 50.112, "r_y3": 528.171, "coord_origin": "TOPLEFT"}, "text": "Figure 4:", "orig": "Figure 4:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 103, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 90.73, "r_y0": 536.723, "r_x1": 229.787, "r_y1": 536.723, "r_x2": 229.787, "r_y2": 528.171, "r_x3": 90.73, "r_y3": 528.171, "coord_origin": "TOPLEFT"}, "text": "Given an input image of a table, the", "orig": "Given an input image of a table, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 104, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 231.787, "r_y0": 536.739, "r_x1": 267.762, "r_y1": 536.739, "r_x2": 267.762, "r_y2": 527.783, "r_x3": 231.787, "r_y3": 527.783, "coord_origin": "TOPLEFT"}, "text": "Encoder", "orig": "Encoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 105, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 269.764, "r_y0": 536.723, "r_x1": 286.362, "r_y1": 536.723, "r_x2": 286.362, "r_y2": 528.171, "r_x3": 269.764, "r_y3": 528.171, "coord_origin": "TOPLEFT"}, "text": "pro-", "orig": "pro-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 106, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 548.678, "r_x1": 286.365, "r_y1": 548.678, "r_x2": 286.365, "r_y2": 540.126, "r_x3": 50.112, "r_y3": 540.126, "coord_origin": "TOPLEFT"}, "text": "duces fixed-length features that represent the input image.", "orig": "duces fixed-length features that represent the input image.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 107, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 560.634, "r_x1": 205.847, "r_y1": 560.634, "r_x2": 205.847, "r_y2": 552.082, "r_x3": 50.112, "r_y3": 552.082, "coord_origin": "TOPLEFT"}, "text": "The features are then passed to both the", "orig": "The features are then passed to both the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 108, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 208.018, "r_y0": 560.65, "r_x1": 286.364, "r_y1": 560.65, "r_x2": 286.364, "r_y2": 551.694, "r_x3": 208.018, "r_y3": 551.694, "coord_origin": "TOPLEFT"}, "text": "Structure Decoder", "orig": "Structure Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 109, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 572.5889999999999, "r_x1": 64.498, "r_y1": 572.5889999999999, "r_x2": 64.498, "r_y2": 564.037, "r_x3": 50.112, "r_y3": 564.037, "coord_origin": "TOPLEFT"}, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 110, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 68.165, "r_y0": 572.605, "r_x1": 151.313, "r_y1": 572.605, "r_x2": 151.313, "r_y2": 563.649, "r_x3": 68.165, "r_y3": 563.649, "coord_origin": "TOPLEFT"}, "text": "Cell BBox Decoder", "orig": "Cell BBox Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 111, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.313, "r_y0": 572.5889999999999, "r_x1": 153.804, "r_y1": 572.5889999999999, "r_x2": 153.804, "r_y2": 564.037, "r_x3": 151.313, "r_y3": 564.037, "coord_origin": "TOPLEFT"}, "text": ".", "orig": ".", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 112, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.419, "r_y0": 572.5889999999999, "r_x1": 241.933, "r_y1": 572.5889999999999, "r_x2": 241.933, "r_y2": 564.037, "r_x3": 160.419, "r_y3": 564.037, "coord_origin": "TOPLEFT"}, "text": "During training, the", "orig": "During training, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 113, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 245.595, "r_y0": 572.605, "r_x1": 286.362, "r_y1": 572.605, "r_x2": 286.362, "r_y2": 563.649, "r_x3": 245.595, "r_y3": 563.649, "coord_origin": "TOPLEFT"}, "text": "Structure", "orig": "Structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 114, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 584.56, "r_x1": 85.519, "r_y1": 584.56, "r_x2": 85.519, "r_y2": 575.604, "r_x3": 50.112, "r_y3": 575.604, "coord_origin": "TOPLEFT"}, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 115, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 88.623, "r_y0": 584.544, "r_x1": 286.361, "r_y1": 584.544, "r_x2": 286.361, "r_y2": 575.992, "r_x3": 88.623, "r_y3": 575.992, "coord_origin": "TOPLEFT"}, "text": "receives 'tokenized tags' of the HTML code that", "orig": "receives 'tokenized tags' of the HTML code that", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 116, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 596.499, "r_x1": 286.365, "r_y1": 596.499, "r_x2": 286.365, "r_y2": 587.947, "r_x3": 50.112, "r_y3": 587.947, "coord_origin": "TOPLEFT"}, "text": "represent the table structure. Afterwards, a transformer en-", "orig": "represent the table structure. Afterwards, a transformer en-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 117, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 608.454, "r_x1": 286.365, "r_y1": 608.454, "r_x2": 286.365, "r_y2": 599.902, "r_x3": 50.112, "r_y3": 599.902, "coord_origin": "TOPLEFT"}, "text": "coder and decoder architecture is employed to produce fea-", "orig": "coder and decoder architecture is employed to produce fea-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 118, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 620.409, "r_x1": 240.438, "r_y1": 620.409, "r_x2": 240.438, "r_y2": 611.857, "r_x3": 50.112, "r_y3": 611.857, "coord_origin": "TOPLEFT"}, "text": "tures that are received by a linear layer, and the", "orig": "tures that are received by a linear layer, and the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 119, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 243.198, "r_y0": 620.425, "r_x1": 286.366, "r_y1": 620.425, "r_x2": 286.366, "r_y2": 611.469, "r_x3": 243.198, "r_y3": 611.469, "coord_origin": "TOPLEFT"}, "text": "Cell BBox", "orig": "Cell BBox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 120, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 632.381, "r_x1": 87.013, "r_y1": 632.381, "r_x2": 87.013, "r_y2": 623.425, "r_x3": 50.112, "r_y3": 623.425, "coord_origin": "TOPLEFT"}, "text": "Decoder.", "orig": "Decoder.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 121, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 93.14, "r_y0": 632.381, "r_x1": 286.365, "r_y1": 632.381, "r_x2": 286.365, "r_y2": 623.425, "r_x3": 93.14, "r_y3": 623.425, "coord_origin": "TOPLEFT"}, "text": "The linear layer is applied to the features to", "orig": "The linear layer is applied to the features to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 122, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 644.336, "r_x1": 286.365, "r_y1": 644.336, "r_x2": 286.365, "r_y2": 635.38, "r_x3": 50.112, "r_y3": 635.38, "coord_origin": "TOPLEFT"}, "text": "predict the tags. Simultaneously, the Cell BBox Decoder", "orig": "predict the tags. Simultaneously, the Cell BBox Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 123, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 656.275, "r_x1": 220.582, "r_y1": 656.275, "r_x2": 220.582, "r_y2": 647.723, "r_x3": 50.112, "r_y3": 647.723, "coord_origin": "TOPLEFT"}, "text": "selects features referring to the data cells ('", "orig": "selects features referring to the data cells ('", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 124, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 220.578, "r_y0": 656.111, "r_x1": 228.327, "r_y1": 656.111, "r_x2": 228.327, "r_y2": 647.405, "r_x3": 220.578, "r_y3": 647.405, "coord_origin": "TOPLEFT"}, "text": "<", "orig": "<", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 125, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 228.327, "r_y0": 656.275, "r_x1": 236.078, "r_y1": 656.275, "r_x2": 236.078, "r_y2": 647.723, "r_x3": 228.327, "r_y3": 647.723, "coord_origin": "TOPLEFT"}, "text": "td", "orig": "td", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 126, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 236.078, "r_y0": 656.111, "r_x1": 243.827, "r_y1": 656.111, "r_x2": 243.827, "r_y2": 647.405, "r_x3": 236.078, "r_y3": 647.405, "coord_origin": "TOPLEFT"}, "text": ">", "orig": ">", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 127, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 243.826, "r_y0": 656.275, "r_x1": 255.293, "r_y1": 656.275, "r_x2": 255.293, "r_y2": 647.723, "r_x3": 243.826, "r_y3": 647.723, "coord_origin": "TOPLEFT"}, "text": "', '", "orig": "', '", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 128, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 255.291, "r_y0": 656.111, "r_x1": 263.04, "r_y1": 656.111, "r_x2": 263.04, "r_y2": 647.405, "r_x3": 255.291, "r_y3": 647.405, "coord_origin": "TOPLEFT"}, "text": "<", "orig": "<", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 129, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 263.04, "r_y0": 656.275, "r_x1": 286.362, "r_y1": 656.275, "r_x2": 286.362, "r_y2": 647.723, "r_x3": 263.04, "r_y3": 647.723, "coord_origin": "TOPLEFT"}, "text": "') and", "orig": "') and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 130, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 668.23, "r_x1": 286.365, "r_y1": 668.23, "r_x2": 286.365, "r_y2": 659.678, "r_x3": 50.112, "r_y3": 659.678, "coord_origin": "TOPLEFT"}, "text": "passes them through an attention network, an MLP, and a", "orig": "passes them through an attention network, an MLP, and a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 131, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 680.185, "r_x1": 218.47, "r_y1": 680.185, "r_x2": 218.47, "r_y2": 671.633, "r_x3": 50.112, "r_y3": 671.633, "coord_origin": "TOPLEFT"}, "text": "linear layer to predict the bounding boxes.", "orig": "linear layer to predict the bounding boxes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Figure 4: Given an input image of a table, the Encoder produces fixed-length features that represent the input image. The features are then passed to both the Structure Decoder and Cell BBox Decoder . During training, the Structure Decoder receives 'tokenized tags' of the HTML code that represent the table structure. Afterwards, a transformer encoder and decoder architecture is employed to produce features that are received by a linear layer, and the Cell BBox Decoder. The linear layer is applied to the features to predict the tags. Simultaneously, the Cell BBox Decoder selects features referring to the data cells (' < td > ', ' < ') and passes them through an attention network, an MLP, and a linear layer to predict the bounding boxes."}, {"label": "text", "id": 4, "page_no": 4, "cluster": {"id": 4, "label": "text", "bbox": {"l": 308.862, "t": 249.803, "r": 545.115, "b": 294.221, "coord_origin": "TOPLEFT"}, "confidence": 0.9831458330154419, "cells": [{"index": 132, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 258.355, "r_x1": 545.115, "r_y1": 258.355, "r_x2": 545.115, "r_y2": 249.803, "r_x3": 308.862, "r_y3": 249.803, "coord_origin": "TOPLEFT"}, "text": "forming classification, and adding an adaptive pooling layer", "orig": "forming classification, and adding an adaptive pooling layer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 133, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 270.31100000000004, "r_x1": 366.466, "r_y1": 270.31100000000004, "r_x2": 366.466, "r_y2": 261.759, "r_x3": 308.862, "r_y3": 261.759, "coord_origin": "TOPLEFT"}, "text": "of size 28*28.", "orig": "of size 28*28.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 134, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 371.706, "r_y0": 270.31100000000004, "r_x1": 545.115, "r_y1": 270.31100000000004, "r_x2": 545.115, "r_y2": 261.759, "r_x3": 371.706, "r_y3": 261.759, "coord_origin": "TOPLEFT"}, "text": "ResNet by default downsamples the image", "orig": "ResNet by default downsamples the image", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 135, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 282.266, "r_x1": 545.115, "r_y1": 282.266, "r_x2": 545.115, "r_y2": 273.71400000000006, "r_x3": 308.862, "r_y3": 273.71400000000006, "coord_origin": "TOPLEFT"}, "text": "resolution by 32 and then the encoded image is provided to", "orig": "resolution by 32 and then the encoded image is provided to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 136, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 294.221, "r_x1": 341.24, "r_y1": 294.221, "r_x2": 341.24, "r_y2": 285.669, "r_x3": 308.862, "r_y3": 285.669, "coord_origin": "TOPLEFT"}, "text": "both the", "orig": "both the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 137, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 343.731, "r_y0": 294.078, "r_x1": 417.235, "r_y1": 294.078, "r_x2": 417.235, "r_y2": 285.49, "r_x3": 343.731, "r_y3": 285.49, "coord_origin": "TOPLEFT"}, "text": "Structure Decoder", "orig": "Structure Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 138, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 417.234, "r_y0": 294.221, "r_x1": 436.601, "r_y1": 294.221, "r_x2": 436.601, "r_y2": 285.669, "r_x3": 417.234, "r_y3": 285.669, "coord_origin": "TOPLEFT"}, "text": ", and", "orig": ", and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 139, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 439.092, "r_y0": 294.078, "r_x1": 516.561, "r_y1": 294.078, "r_x2": 516.561, "r_y2": 285.49, "r_x3": 439.092, "r_y3": 285.49, "coord_origin": "TOPLEFT"}, "text": "Cell BBox Decoder", "orig": "Cell BBox Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 140, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 516.561, "r_y0": 294.221, "r_x1": 519.052, "r_y1": 294.221, "r_x2": 519.052, "r_y2": 285.669, "r_x3": 516.561, "r_y3": 285.669, "coord_origin": "TOPLEFT"}, "text": ".", "orig": ".", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "forming classification, and adding an adaptive pooling layer of size 28*28. ResNet by default downsamples the image resolution by 32 and then the encoded image is provided to both the Structure Decoder , and Cell BBox Decoder ."}, {"label": "text", "id": 1, "page_no": 4, "cluster": {"id": 1, "label": "text", "bbox": {"l": 308.862, "t": 297.34, "r": 545.115, "b": 413.876, "coord_origin": "TOPLEFT"}, "confidence": 0.9862009882926941, "cells": [{"index": 141, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 306.296, "r_x1": 400.866, "r_y1": 306.296, "r_x2": 400.866, "r_y2": 297.34, "r_x3": 320.817, "r_y3": 297.34, "coord_origin": "TOPLEFT"}, "text": "Structure Decoder.", "orig": "Structure Decoder.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 142, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 403.914, "r_y0": 306.28, "r_x1": 545.114, "r_y1": 306.28, "r_x2": 545.114, "r_y2": 297.728, "r_x3": 403.914, "r_y3": 297.728, "coord_origin": "TOPLEFT"}, "text": "The transformer architecture of this", "orig": "The transformer architecture of this", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 143, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 318.235, "r_x1": 517.529, "r_y1": 318.235, "r_x2": 517.529, "r_y2": 309.683, "r_x3": 308.862, "r_y3": 309.683, "coord_origin": "TOPLEFT"}, "text": "component is based on the work proposed in [31].", "orig": "component is based on the work proposed in [31].", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 144, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 524.094, "r_y0": 318.235, "r_x1": 545.115, "r_y1": 318.235, "r_x2": 545.115, "r_y2": 309.683, "r_x3": 524.094, "r_y3": 309.683, "coord_origin": "TOPLEFT"}, "text": "After", "orig": "After", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 145, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 330.19, "r_x1": 432.358, "r_y1": 330.19, "r_x2": 432.358, "r_y2": 321.638, "r_x3": 308.862, "r_y3": 321.638, "coord_origin": "TOPLEFT"}, "text": "extensive experimentation, the", "orig": "extensive experimentation, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 146, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 435.82, "r_y0": 330.047, "r_x1": 510.29, "r_y1": 330.047, "r_x2": 510.29, "r_y2": 321.459, "r_x3": 435.82, "r_y3": 321.459, "coord_origin": "TOPLEFT"}, "text": "Structure Decoder", "orig": "Structure Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 147, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 513.978, "r_y0": 330.19, "r_x1": 520.623, "r_y1": 330.19, "r_x2": 520.623, "r_y2": 321.638, "r_x3": 513.978, "r_y3": 321.638, "coord_origin": "TOPLEFT"}, "text": "is", "orig": "is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 148, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 524.08, "r_y0": 330.19, "r_x1": 545.111, "r_y1": 330.19, "r_x2": 545.111, "r_y2": 321.638, "r_x3": 524.08, "r_y3": 321.638, "coord_origin": "TOPLEFT"}, "text": "mod-", "orig": "mod-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 149, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 342.145, "r_x1": 545.115, "r_y1": 342.145, "r_x2": 545.115, "r_y2": 333.593, "r_x3": 308.862, "r_y3": 333.593, "coord_origin": "TOPLEFT"}, "text": "eled as a transformer encoder with two encoder layers and", "orig": "eled as a transformer encoder with two encoder layers and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 150, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 354.1, "r_x1": 545.115, "r_y1": 354.1, "r_x2": 545.115, "r_y2": 345.548, "r_x3": 308.862, "r_y3": 345.548, "coord_origin": "TOPLEFT"}, "text": "a transformer decoder made from a stack of 4 decoder lay-", "orig": "a transformer decoder made from a stack of 4 decoder lay-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 151, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 366.056, "r_x1": 545.115, "r_y1": 366.056, "r_x2": 545.115, "r_y2": 357.504, "r_x3": 308.862, "r_y3": 357.504, "coord_origin": "TOPLEFT"}, "text": "ers that comprise mainly of multi-head attention and feed", "orig": "ers that comprise mainly of multi-head attention and feed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 152, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 378.011, "r_x1": 370.391, "r_y1": 378.011, "r_x2": 370.391, "r_y2": 369.459, "r_x3": 308.862, "r_y3": 369.459, "coord_origin": "TOPLEFT"}, "text": "forward layers.", "orig": "forward layers.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 153, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 377.445, "r_y0": 378.011, "r_x1": 545.115, "r_y1": 378.011, "r_x2": 545.115, "r_y2": 369.459, "r_x3": 377.445, "r_y3": 369.459, "coord_origin": "TOPLEFT"}, "text": "This configuration uses fewer layers and", "orig": "This configuration uses fewer layers and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 154, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 389.966, "r_x1": 545.115, "r_y1": 389.966, "r_x2": 545.115, "r_y2": 381.414, "r_x3": 308.862, "r_y3": 381.414, "coord_origin": "TOPLEFT"}, "text": "heads in comparison to networks applied to other problems", "orig": "heads in comparison to networks applied to other problems", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 155, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 401.921, "r_x1": 326.566, "r_y1": 401.921, "r_x2": 326.566, "r_y2": 393.369, "r_x3": 308.862, "r_y3": 393.369, "coord_origin": "TOPLEFT"}, "text": "(e.g.", "orig": "(e.g.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 156, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 331.069, "r_y0": 401.921, "r_x1": 545.115, "r_y1": 401.921, "r_x2": 545.115, "r_y2": 393.369, "r_x3": 331.069, "r_y3": 393.369, "coord_origin": "TOPLEFT"}, "text": "'Scene Understanding', 'Image Captioning'), some-", "orig": "'Scene Understanding', 'Image Captioning'), some-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 157, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 413.876, "r_x1": 528.019, "r_y1": 413.876, "r_x2": 528.019, "r_y2": 405.324, "r_x3": 308.862, "r_y3": 405.324, "coord_origin": "TOPLEFT"}, "text": "thing which we relate to the simplicity of table images.", "orig": "thing which we relate to the simplicity of table images.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Structure Decoder. The transformer architecture of this component is based on the work proposed in [31]. After extensive experimentation, the Structure Decoder is modeled as a transformer encoder with two encoder layers and a transformer decoder made from a stack of 4 decoder layers that comprise mainly of multi-head attention and feed forward layers. This configuration uses fewer layers and heads in comparison to networks applied to other problems (e.g. 'Scene Understanding', 'Image Captioning'), something which we relate to the simplicity of table images."}, {"label": "text", "id": 3, "page_no": 4, "cluster": {"id": 3, "label": "text", "bbox": {"l": 308.862, "t": 417.383, "r": 545.115, "b": 545.487, "coord_origin": "TOPLEFT"}, "confidence": 0.9851906895637512, "cells": [{"index": 158, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 425.935, "r_x1": 336.309, "r_y1": 425.935, "r_x2": 336.309, "r_y2": 417.383, "r_x3": 320.817, "r_y3": 417.383, "coord_origin": "TOPLEFT"}, "text": "The", "orig": "The", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 159, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 341.579, "r_y0": 425.935, "r_x1": 388.055, "r_y1": 425.935, "r_x2": 388.055, "r_y2": 417.383, "r_x3": 341.579, "r_y3": 417.383, "coord_origin": "TOPLEFT"}, "text": "transformer", "orig": "transformer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 160, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 393.325, "r_y0": 425.935, "r_x1": 424.856, "r_y1": 425.935, "r_x2": 424.856, "r_y2": 417.383, "r_x3": 393.325, "r_y3": 417.383, "coord_origin": "TOPLEFT"}, "text": "encoder", "orig": "encoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 161, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 430.117, "r_y0": 425.935, "r_x1": 462.356, "r_y1": 425.935, "r_x2": 462.356, "r_y2": 417.383, "r_x3": 430.117, "r_y3": 417.383, "coord_origin": "TOPLEFT"}, "text": "receives", "orig": "receives", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 162, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 467.626, "r_y0": 425.935, "r_x1": 477.031, "r_y1": 425.935, "r_x2": 477.031, "r_y2": 417.383, "r_x3": 467.626, "r_y3": 417.383, "coord_origin": "TOPLEFT"}, "text": "an", "orig": "an", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 163, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 482.301, "r_y0": 425.935, "r_x1": 515.496, "r_y1": 425.935, "r_x2": 515.496, "r_y2": 417.383, "r_x3": 482.301, "r_y3": 417.383, "coord_origin": "TOPLEFT"}, "text": "encoded", "orig": "encoded", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 164, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 520.766, "r_y0": 425.935, "r_x1": 545.115, "r_y1": 425.935, "r_x2": 545.115, "r_y2": 417.383, "r_x3": 520.766, "r_y3": 417.383, "coord_origin": "TOPLEFT"}, "text": "image", "orig": "image", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 165, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 437.89, "r_x1": 343.721, "r_y1": 437.89, "r_x2": 343.721, "r_y2": 429.338, "r_x3": 308.862, "r_y3": 429.338, "coord_origin": "TOPLEFT"}, "text": "from the", "orig": "from the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 166, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 347.038, "r_y0": 437.747, "r_x1": 446.455, "r_y1": 437.747, "r_x2": 446.455, "r_y2": 429.159, "r_x3": 347.038, "r_y3": 429.159, "coord_origin": "TOPLEFT"}, "text": "CNN Backbone Network", "orig": "CNN Backbone Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 167, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 449.94, "r_y0": 437.89, "r_x1": 545.113, "r_y1": 437.89, "r_x2": 545.113, "r_y2": 429.338, "r_x3": 449.94, "r_y3": 429.338, "coord_origin": "TOPLEFT"}, "text": "and refines it through a", "orig": "and refines it through a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 168, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 449.845, "r_x1": 545.115, "r_y1": 449.845, "r_x2": 545.115, "r_y2": 441.293, "r_x3": 308.862, "r_y3": 441.293, "coord_origin": "TOPLEFT"}, "text": "multi-head dot-product attention layer, followed by a Feed", "orig": "multi-head dot-product attention layer, followed by a Feed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 169, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 461.8, "r_x1": 384.149, "r_y1": 461.8, "r_x2": 384.149, "r_y2": 453.248, "r_x3": 308.862, "r_y3": 453.248, "coord_origin": "TOPLEFT"}, "text": "Forward Network.", "orig": "Forward Network.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 170, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 393.375, "r_y0": 461.8, "r_x1": 459.616, "r_y1": 461.8, "r_x2": 459.616, "r_y2": 453.248, "r_x3": 393.375, "r_y3": 453.248, "coord_origin": "TOPLEFT"}, "text": "During training,", "orig": "During training,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 171, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 464.667, "r_y0": 461.8, "r_x1": 476.841, "r_y1": 461.8, "r_x2": 476.841, "r_y2": 453.248, "r_x3": 464.667, "r_y3": 453.248, "coord_origin": "TOPLEFT"}, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 172, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 481.374, "r_y0": 461.8, "r_x1": 527.85, "r_y1": 461.8, "r_x2": 527.85, "r_y2": 453.248, "r_x3": 481.374, "r_y3": 453.248, "coord_origin": "TOPLEFT"}, "text": "transformer", "orig": "transformer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 173, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 532.393, "r_y0": 461.8, "r_x1": 545.115, "r_y1": 461.8, "r_x2": 545.115, "r_y2": 453.248, "r_x3": 532.393, "r_y3": 453.248, "coord_origin": "TOPLEFT"}, "text": "de-", "orig": "de-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 174, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 473.756, "r_x1": 545.115, "r_y1": 473.756, "r_x2": 545.115, "r_y2": 465.204, "r_x3": 308.862, "r_y3": 465.204, "coord_origin": "TOPLEFT"}, "text": "coder receives as input the output feature produced by the", "orig": "coder receives as input the output feature produced by the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 175, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 485.711, "r_x1": 545.115, "r_y1": 485.711, "r_x2": 545.115, "r_y2": 477.159, "r_x3": 308.862, "r_y3": 477.159, "coord_origin": "TOPLEFT"}, "text": "transformer encoder, and the tokenized input of the HTML", "orig": "transformer encoder, and the tokenized input of the HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 176, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 497.666, "r_x1": 545.115, "r_y1": 497.666, "r_x2": 545.115, "r_y2": 489.114, "r_x3": 308.862, "r_y3": 489.114, "coord_origin": "TOPLEFT"}, "text": "ground-truth tags. Using a stack of multi-head attention lay-", "orig": "ground-truth tags. Using a stack of multi-head attention lay-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 177, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 509.621, "r_x1": 545.115, "r_y1": 509.621, "r_x2": 545.115, "r_y2": 501.069, "r_x3": 308.862, "r_y3": 501.069, "coord_origin": "TOPLEFT"}, "text": "ers, different aspects of the tag sequence could be inferred.", "orig": "ers, different aspects of the tag sequence could be inferred.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 178, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 521.576, "r_x1": 545.115, "r_y1": 521.576, "r_x2": 545.115, "r_y2": 513.024, "r_x3": 308.862, "r_y3": 513.024, "coord_origin": "TOPLEFT"}, "text": "This is achieved by each attention head on a layer operating", "orig": "This is achieved by each attention head on a layer operating", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 179, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 533.5319999999999, "r_x1": 545.115, "r_y1": 533.5319999999999, "r_x2": 545.115, "r_y2": 524.98, "r_x3": 308.862, "r_y3": 524.98, "coord_origin": "TOPLEFT"}, "text": "in a different subspace, and then combining altogether their", "orig": "in a different subspace, and then combining altogether their", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 180, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 545.487, "r_x1": 369.733, "r_y1": 545.487, "r_x2": 369.733, "r_y2": 536.935, "r_x3": 308.862, "r_y3": 536.935, "coord_origin": "TOPLEFT"}, "text": "attention score.", "orig": "attention score.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "The transformer encoder receives an encoded image from the CNN Backbone Network and refines it through a multi-head dot-product attention layer, followed by a Feed Forward Network. During training, the transformer decoder receives as input the output feature produced by the transformer encoder, and the tokenized input of the HTML ground-truth tags. Using a stack of multi-head attention layers, different aspects of the tag sequence could be inferred. This is achieved by each attention head on a layer operating in a different subspace, and then combining altogether their attention score."}, {"label": "text", "id": 0, "page_no": 4, "cluster": {"id": 0, "label": "text", "bbox": {"l": 308.862, "t": 548.605, "r": 545.115, "b": 653.187, "coord_origin": "TOPLEFT"}, "confidence": 0.9869195818901062, "cells": [{"index": 181, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 557.561, "r_x1": 404.762, "r_y1": 557.561, "r_x2": 404.762, "r_y2": 548.605, "r_x3": 320.817, "r_y3": 548.605, "coord_origin": "TOPLEFT"}, "text": "Cell BBox Decoder.", "orig": "Cell BBox Decoder.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 182, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 410.341, "r_y0": 557.545, "r_x1": 545.115, "r_y1": 557.545, "r_x2": 545.115, "r_y2": 548.9929999999999, "r_x3": 410.341, "r_y3": 548.9929999999999, "coord_origin": "TOPLEFT"}, "text": "Our architecture allows to simul-", "orig": "Our architecture allows to simul-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 183, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 569.501, "r_x1": 545.115, "r_y1": 569.501, "r_x2": 545.115, "r_y2": 560.9490000000001, "r_x3": 308.862, "r_y3": 560.9490000000001, "coord_origin": "TOPLEFT"}, "text": "taneously predict HTML tags and bounding boxes for each", "orig": "taneously predict HTML tags and bounding boxes for each", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 184, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 581.456, "r_x1": 545.115, "r_y1": 581.456, "r_x2": 545.115, "r_y2": 572.904, "r_x3": 308.862, "r_y3": 572.904, "coord_origin": "TOPLEFT"}, "text": "table cell without the need of a separate object detector end", "orig": "table cell without the need of a separate object detector end", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 185, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 593.4110000000001, "r_x1": 336.458, "r_y1": 593.4110000000001, "r_x2": 336.458, "r_y2": 584.859, "r_x3": 308.862, "r_y3": 584.859, "coord_origin": "TOPLEFT"}, "text": "to end.", "orig": "to end.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 186, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 340.971, "r_y0": 593.4110000000001, "r_x1": 545.115, "r_y1": 593.4110000000001, "r_x2": 545.115, "r_y2": 584.859, "r_x3": 340.971, "r_y3": 584.859, "coord_origin": "TOPLEFT"}, "text": "This approach is inspired by DETR [1] which em-", "orig": "This approach is inspired by DETR [1] which em-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 187, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 605.366, "r_x1": 545.115, "r_y1": 605.366, "r_x2": 545.115, "r_y2": 596.814, "r_x3": 308.862, "r_y3": 596.814, "coord_origin": "TOPLEFT"}, "text": "ploys a Transformer Encoder, and Decoder that looks for", "orig": "ploys a Transformer Encoder, and Decoder that looks for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 188, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 617.321, "r_x1": 545.115, "r_y1": 617.321, "r_x2": 545.115, "r_y2": 608.769, "r_x3": 308.862, "r_y3": 608.769, "coord_origin": "TOPLEFT"}, "text": "a specific number of object queries (potential object detec-", "orig": "a specific number of object queries (potential object detec-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 189, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 629.2760000000001, "r_x1": 545.115, "r_y1": 629.2760000000001, "r_x2": 545.115, "r_y2": 620.7239999999999, "r_x3": 308.862, "r_y3": 620.7239999999999, "coord_origin": "TOPLEFT"}, "text": "tions). As our model utilizes a transformer architecture, the", "orig": "tions). As our model utilizes a transformer architecture, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 190, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 641.232, "r_x1": 381.679, "r_y1": 641.232, "r_x2": 381.679, "r_y2": 632.6800000000001, "r_x3": 308.862, "r_y3": 632.6800000000001, "coord_origin": "TOPLEFT"}, "text": "hidden state of the", "orig": "hidden state of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 191, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 383.997, "r_y0": 641.068, "r_x1": 391.746, "r_y1": 641.068, "r_x2": 391.746, "r_y2": 632.362, "r_x3": 383.997, "r_y3": 632.362, "coord_origin": "TOPLEFT"}, "text": "<", "orig": "<", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 192, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 391.746, "r_y0": 641.232, "r_x1": 399.497, "r_y1": 641.232, "r_x2": 399.497, "r_y2": 632.6800000000001, "r_x3": 391.746, "r_y3": 632.6800000000001, "coord_origin": "TOPLEFT"}, "text": "td", "orig": "td", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 193, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 399.497, "r_y0": 641.068, "r_x1": 407.246, "r_y1": 641.068, "r_x2": 407.246, "r_y2": 632.362, "r_x3": 399.497, "r_y3": 632.362, "coord_origin": "TOPLEFT"}, "text": ">", "orig": ">", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 194, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 407.246, "r_y0": 641.232, "r_x1": 432.91, "r_y1": 641.232, "r_x2": 432.91, "r_y2": 632.6800000000001, "r_x3": 407.246, "r_y3": 632.6800000000001, "coord_origin": "TOPLEFT"}, "text": "' and '", "orig": "' and '", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 195, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 432.908, "r_y0": 641.068, "r_x1": 440.657, "r_y1": 641.068, "r_x2": 440.657, "r_y2": 632.362, "r_x3": 432.908, "r_y3": 632.362, "coord_origin": "TOPLEFT"}, "text": "<", "orig": "<", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 196, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 440.657, "r_y0": 641.232, "r_x1": 545.115, "r_y1": 641.232, "r_x2": 545.115, "r_y2": 632.6800000000001, "r_x3": 440.657, "r_y3": 632.6800000000001, "coord_origin": "TOPLEFT"}, "text": "' HTMLstructure tags be-", "orig": "' HTMLstructure tags be-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 197, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 653.187, "r_x1": 398.964, "r_y1": 653.187, "r_x2": 398.964, "r_y2": 644.635, "r_x3": 308.862, "r_y3": 644.635, "coord_origin": "TOPLEFT"}, "text": "come the object query.", "orig": "come the object query.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Cell BBox Decoder. Our architecture allows to simultaneously predict HTML tags and bounding boxes for each table cell without the need of a separate object detector end to end. This approach is inspired by DETR [1] which employs a Transformer Encoder, and Decoder that looks for a specific number of object queries (potential object detections). As our model utilizes a transformer architecture, the hidden state of the < td > ' and ' < ' HTMLstructure tags become the object query."}, {"label": "text", "id": 2, "page_no": 4, "cluster": {"id": 2, "label": "text", "bbox": {"l": 308.862, "t": 656.515, "r": 545.115, "b": 713.066, "coord_origin": "TOPLEFT"}, "confidence": 0.9852352142333984, "cells": [{"index": 198, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 665.246, "r_x1": 444.343, "r_y1": 665.246, "r_x2": 444.343, "r_y2": 656.694, "r_x3": 320.817, "r_y3": 656.694, "coord_origin": "TOPLEFT"}, "text": "The encoding generated by the", "orig": "The encoding generated by the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 199, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 447.006, "r_y0": 665.103, "r_x1": 545.108, "r_y1": 665.103, "r_x2": 545.108, "r_y2": 656.515, "r_x3": 447.006, "r_y3": 656.515, "coord_origin": "TOPLEFT"}, "text": "CNN Backbone Network", "orig": "CNN Backbone Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 200, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 677.201, "r_x1": 545.115, "r_y1": 677.201, "r_x2": 545.115, "r_y2": 668.649, "r_x3": 308.862, "r_y3": 668.649, "coord_origin": "TOPLEFT"}, "text": "along with the features acquired for every data cell from the", "orig": "along with the features acquired for every data cell from the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 201, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 689.156, "r_x1": 545.115, "r_y1": 689.156, "r_x2": 545.115, "r_y2": 680.604, "r_x3": 308.862, "r_y3": 680.604, "coord_origin": "TOPLEFT"}, "text": "Transformer Decoder are then passed to the attention net-", "orig": "Transformer Decoder are then passed to the attention net-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 202, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 701.111, "r_x1": 545.115, "r_y1": 701.111, "r_x2": 545.115, "r_y2": 692.559, "r_x3": 308.862, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "work. The attention network takes both inputs and learns to", "orig": "work. The attention network takes both inputs and learns to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 203, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 713.066, "r_x1": 470.425, "r_y1": 713.066, "r_x2": 470.425, "r_y2": 704.514, "r_x3": 308.862, "r_y3": 704.514, "coord_origin": "TOPLEFT"}, "text": "provide an attention weighted encoding.", "orig": "provide an attention weighted encoding.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 204, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 474.63, "r_y0": 713.066, "r_x1": 545.115, "r_y1": 713.066, "r_x2": 545.115, "r_y2": 704.514, "r_x3": 474.63, "r_y3": 704.514, "coord_origin": "TOPLEFT"}, "text": "This weighted at-", "orig": "This weighted at-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "The encoding generated by the CNN Backbone Network along with the features acquired for every data cell from the Transformer Decoder are then passed to the attention network. The attention network takes both inputs and learns to provide an attention weighted encoding. This weighted at-"}, {"label": "page_footer", "id": 9, "page_no": 4, "cluster": {"id": 9, "label": "page_footer", "bbox": {"l": 295.121, "t": 734.402, "r": 300.102, "b": 742.954, "coord_origin": "TOPLEFT"}, "confidence": 0.8719564080238342, "cells": [{"index": 205, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 295.121, "r_y0": 742.954, "r_x1": 300.102, "r_y1": 742.954, "r_x2": 300.102, "r_y2": 734.402, "r_x3": 295.121, "r_y3": 734.402, "coord_origin": "TOPLEFT"}, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "5"}], "body": [{"label": "picture", "id": 7, "page_no": 4, "cluster": {"id": 7, "label": "picture", "bbox": {"l": 74.30525970458984, "t": 77.91120147705078, "r": 519.9801025390625, "b": 183.70150756835938, "coord_origin": "TOPLEFT"}, "confidence": 0.9296807646751404, "cells": [{"index": 0, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 81.688, "r_y0": 125.61699999999996, "r_x1": 84.524, "r_y1": 125.61699999999996, "r_x2": 84.524, "r_y2": 122.481, "r_x3": 81.688, "r_y3": 122.481, "coord_origin": "TOPLEFT"}, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 86.413, "r_y0": 125.61699999999996, "r_x1": 93.026, "r_y1": 125.61699999999996, "r_x2": 93.026, "r_y2": 122.481, "r_x3": 86.413, "r_y3": 122.481, "coord_origin": "TOPLEFT"}, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 102.505, "r_y0": 118.42999999999995, "r_x1": 115.346, "r_y1": 118.42999999999995, "r_x2": 115.346, "r_y2": 115.293, "r_x3": 102.505, "r_y3": 115.293, "coord_origin": "TOPLEFT"}, "text": "Amount", "orig": "Amount", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 82.14, "r_y0": 118.39200000000005, "r_x1": 93.292, "r_y1": 118.39200000000005, "r_x2": 93.292, "r_y2": 115.25599999999997, "r_x3": 82.14, "r_y3": 115.25599999999997, "coord_origin": "TOPLEFT"}, "text": "Names", "orig": "Names", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 96.748, "r_y0": 125.61699999999996, "r_x1": 104.312, "r_y1": 125.61699999999996, "r_x2": 104.312, "r_y2": 122.481, "r_x3": 96.748, "r_y3": 122.481, "coord_origin": "TOPLEFT"}, "text": "1000", "orig": "1000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 96.748, "r_y0": 130.92100000000005, "r_x1": 102.421, "r_y1": 130.92100000000005, "r_x2": 102.421, "r_y2": 127.78499999999997, "r_x3": 96.748, "r_y3": 127.78499999999997, "coord_origin": "TOPLEFT"}, "text": "500", "orig": "500", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 96.748, "r_y0": 136.63300000000004, "r_x1": 104.312, "r_y1": 136.63300000000004, "r_x2": 104.312, "r_y2": 133.49699999999996, "r_x3": 96.748, "r_y3": 133.49699999999996, "coord_origin": "TOPLEFT"}, "text": "3500", "orig": "3500", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 96.748, "r_y0": 142.34500000000003, "r_x1": 102.421, "r_y1": 142.34500000000003, "r_x2": 102.421, "r_y2": 139.20899999999995, "r_x3": 96.748, "r_y3": 139.20899999999995, "coord_origin": "TOPLEFT"}, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 110.661, "r_y0": 125.61699999999996, "r_x1": 116.144, "r_y1": 125.61699999999996, "r_x2": 116.144, "r_y2": 122.481, "r_x3": 110.661, "r_y3": 122.481, "coord_origin": "TOPLEFT"}, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 110.661, "r_y0": 130.92100000000005, "r_x1": 116.144, "r_y1": 130.92100000000005, "r_x2": 116.144, "r_y2": 127.78499999999997, "r_x3": 110.661, "r_y3": 127.78499999999997, "coord_origin": "TOPLEFT"}, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 110.661, "r_y0": 136.63300000000004, "r_x1": 116.144, "r_y1": 136.63300000000004, "r_x2": 116.144, "r_y2": 133.49699999999996, "r_x3": 110.661, "r_y3": 133.49699999999996, "coord_origin": "TOPLEFT"}, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 110.661, "r_y0": 142.34500000000003, "r_x1": 116.144, "r_y1": 142.34500000000003, "r_x2": 116.144, "r_y2": 139.20899999999995, "r_x3": 110.661, "r_y3": 139.20899999999995, "coord_origin": "TOPLEFT"}, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 81.688, "r_y0": 130.92100000000005, "r_x1": 84.524, "r_y1": 130.92100000000005, "r_x2": 84.524, "r_y2": 127.78499999999997, "r_x3": 81.688, "r_y3": 127.78499999999997, "coord_origin": "TOPLEFT"}, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 86.413, "r_y0": 130.92100000000005, "r_x1": 93.026, "r_y1": 130.92100000000005, "r_x2": 93.026, "r_y2": 127.78499999999997, "r_x3": 86.413, "r_y3": 127.78499999999997, "coord_origin": "TOPLEFT"}, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 81.688, "r_y0": 136.63300000000004, "r_x1": 84.524, "r_y1": 136.63300000000004, "r_x2": 84.524, "r_y2": 133.49699999999996, "r_x3": 81.688, "r_y3": 133.49699999999996, "coord_origin": "TOPLEFT"}, "text": "3.", "orig": "3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 86.413, "r_y0": 136.63300000000004, "r_x1": 93.026, "r_y1": 136.63300000000004, "r_x2": 93.026, "r_y2": 133.49699999999996, "r_x3": 86.413, "r_y3": 133.49699999999996, "coord_origin": "TOPLEFT"}, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 81.688, "r_y0": 142.34500000000003, "r_x1": 84.524, "r_y1": 142.34500000000003, "r_x2": 84.524, "r_y2": 139.20899999999995, "r_x3": 81.688, "r_y3": 139.20899999999995, "coord_origin": "TOPLEFT"}, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 86.413, "r_y0": 142.34500000000003, "r_x1": 93.026, "r_y1": 142.34500000000003, "r_x2": 93.026, "r_y2": 139.20899999999995, "r_x3": 86.413, "r_y3": 139.20899999999995, "coord_origin": "TOPLEFT"}, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 88.084, "r_y0": 96.21699999999998, "r_x1": 113.936, "r_y1": 96.21699999999998, "r_x2": 113.936, "r_y2": 90.57100000000003, "r_x3": 88.084, "r_y3": 90.57100000000003, "coord_origin": "TOPLEFT"}, "text": "Extracted", "orig": "Extracted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 19, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 82.81, "r_y0": 103.35699999999997, "r_x1": 119.212, "r_y1": 103.35699999999997, "r_x2": 119.212, "r_y2": 97.71100000000001, "r_x3": 82.81, "r_y3": 97.71100000000001, "coord_origin": "TOPLEFT"}, "text": "Table Images", "orig": "Table Images", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 20, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 143.942, "r_y0": 106.322, "r_x1": 180.011, "r_y1": 106.322, "r_x2": 180.011, "r_y2": 100.67600000000004, "r_x3": 143.942, "r_y3": 100.67600000000004, "coord_origin": "TOPLEFT"}, "text": "Standardized", "orig": "Standardized", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 21, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.941, "r_y0": 113.46199999999999, "r_x1": 172.012, "r_y1": 113.46199999999999, "r_x2": 172.012, "r_y2": 107.81600000000003, "r_x3": 151.941, "r_y3": 107.81600000000003, "coord_origin": "TOPLEFT"}, "text": "Images", "orig": "Images", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 22, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 251.769, "r_y0": 86.64999999999998, "r_x1": 266.396, "r_y1": 86.64999999999998, "r_x2": 266.396, "r_y2": 81.00400000000002, "r_x3": 251.769, "r_y3": 81.00400000000002, "coord_origin": "TOPLEFT"}, "text": "BBox", "orig": "BBox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 23, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 247.516, "r_y0": 91.75, "r_x1": 270.65, "r_y1": 91.75, "r_x2": 270.65, "r_y2": 86.10400000000004, "r_x3": 247.516, "r_y3": 86.10400000000004, "coord_origin": "TOPLEFT"}, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 24, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 331.037, "r_y0": 84.279, "r_x1": 352.126, "r_y1": 84.279, "r_x2": 352.126, "r_y2": 78.63300000000004, "r_x3": 331.037, "r_y3": 78.63300000000004, "coord_origin": "TOPLEFT"}, "text": "BBoxes", "orig": "BBoxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 25, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 390.564, "r_y0": 101.75199999999995, "r_x1": 431.726, "r_y1": 101.75199999999995, "r_x2": 431.726, "r_y2": 96.106, "r_x3": 390.564, "r_y3": 96.106, "coord_origin": "TOPLEFT"}, "text": "BBoxes can be", "orig": "BBoxes can be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 26, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 386.824, "r_y0": 107.87199999999996, "r_x1": 435.47, "r_y1": 107.87199999999996, "r_x2": 435.47, "r_y2": 102.226, "r_x3": 386.824, "r_y3": 102.226, "coord_origin": "TOPLEFT"}, "text": "traced back to the", "orig": "traced back to the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 27, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 388.696, "r_y0": 113.99199999999996, "r_x1": 433.603, "r_y1": 113.99199999999996, "r_x2": 433.603, "r_y2": 108.346, "r_x3": 388.696, "r_y3": 108.346, "coord_origin": "TOPLEFT"}, "text": "original image to", "orig": "original image to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 28, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 391.078, "r_y0": 120.11199999999997, "r_x1": 431.225, "r_y1": 120.11199999999997, "r_x2": 431.225, "r_y2": 114.46600000000001, "r_x3": 391.078, "r_y3": 114.46600000000001, "coord_origin": "TOPLEFT"}, "text": "extract content", "orig": "extract content", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 29, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 431.227, "r_y0": 157.40499999999997, "r_x1": 498.821, "r_y1": 157.40499999999997, "r_x2": 498.821, "r_y2": 151.75900000000001, "r_x3": 431.227, "r_y3": 151.75900000000001, "coord_origin": "TOPLEFT"}, "text": "Structure Tags sequence", "orig": "Structure Tags sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 30, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 431.174, "r_y0": 163.52499999999998, "r_x1": 498.878, "r_y1": 163.52499999999998, "r_x2": 498.878, "r_y2": 157.87900000000002, "r_x3": 431.174, "r_y3": 157.87900000000002, "coord_origin": "TOPLEFT"}, "text": "provide full description of", "orig": "provide full description of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 440.529, "r_y0": 169.64499999999998, "r_x1": 489.518, "r_y1": 169.64499999999998, "r_x2": 489.518, "r_y2": 163.99900000000002, "r_x3": 440.529, "r_y3": 163.99900000000002, "coord_origin": "TOPLEFT"}, "text": "the table structure", "orig": "the table structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.375, "r_y0": 183.97299999999996, "r_x1": 367.723, "r_y1": 183.97299999999996, "r_x2": 367.723, "r_y2": 178.327, "r_x3": 328.375, "r_y3": 178.327, "coord_origin": "TOPLEFT"}, "text": "Structure Tags", "orig": "Structure Tags", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 331.845, "r_y0": 129.62800000000004, "r_x1": 373.68, "r_y1": 129.62800000000004, "r_x2": 373.68, "r_y2": 123.98199999999997, "r_x3": 331.845, "r_y3": 123.98199999999997, "coord_origin": "TOPLEFT"}, "text": "BBoxes in sync", "orig": "BBoxes in sync", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 331.845, "r_y0": 134.72799999999995, "r_x1": 381.178, "r_y1": 134.72799999999995, "r_x2": 381.178, "r_y2": 129.082, "r_x3": 331.845, "r_y3": 129.082, "coord_origin": "TOPLEFT"}, "text": "with tag sequence", "orig": "with tag sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 196.626, "r_y0": 93.83600000000001, "r_x1": 219.423, "r_y1": 93.83600000000001, "r_x2": 219.423, "r_y2": 88.19000000000005, "r_x3": 196.626, "r_y3": 88.19000000000005, "coord_origin": "TOPLEFT"}, "text": "Encoder", "orig": "Encoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 246.668, "r_y0": 135.21400000000006, "r_x1": 271.499, "r_y1": 135.21400000000006, "r_x2": 271.499, "r_y2": 129.56799999999998, "r_x3": 246.668, "r_y3": 129.56799999999998, "coord_origin": "TOPLEFT"}, "text": "Structure", "orig": "Structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 247.516, "r_y0": 140.31399999999996, "r_x1": 270.65, "r_y1": 140.31399999999996, "r_x2": 270.65, "r_y2": 134.668, "r_x3": 247.516, "r_y3": 134.668, "coord_origin": "TOPLEFT"}, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 330.631, "r_y0": 94.73900000000003, "r_x1": 365.553, "r_y1": 94.73900000000003, "r_x2": 365.553, "r_y2": 89.09299999999996, "r_x3": 330.631, "r_y3": 89.09299999999996, "coord_origin": "TOPLEFT"}, "text": "[x1, y2, x2, y2]", "orig": "[x1, y2, x2, y2]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 330.631, "r_y0": 102.899, "r_x1": 370.227, "r_y1": 102.899, "r_x2": 370.227, "r_y2": 97.25300000000004, "r_x3": 330.631, "r_y3": 97.25300000000004, "coord_origin": "TOPLEFT"}, "text": "[x1', y2', x2', y2']", "orig": "[x1', y2', x2', y2']", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 330.631, "r_y0": 111.05899999999997, "r_x1": 374.512, "r_y1": 111.05899999999997, "r_x2": 374.512, "r_y2": 105.41300000000001, "r_x3": 330.631, "r_y3": 105.41300000000001, "coord_origin": "TOPLEFT"}, "text": "[x1'', y2'', x2'', y2'']", "orig": "[x1'', y2'', x2'', y2'']", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 330.631, "r_y0": 119.21900000000005, "r_x1": 335.732, "r_y1": 119.21900000000005, "r_x2": 335.732, "r_y2": 113.57299999999998, "r_x3": 330.631, "r_y3": 113.57299999999998, "coord_origin": "TOPLEFT"}, "text": "...", "orig": "...", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 322.306, "r_y0": 146.558, "r_x1": 335.06, "r_y1": 146.558, "r_x2": 335.06, "r_y2": 141.85400000000004, "r_x3": 322.306, "r_y3": 141.85400000000004, "coord_origin": "TOPLEFT"}, "text": "<TR>", "orig": "<TR>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 322.306, "r_y0": 153.69799999999998, "r_x1": 421.588, "r_y1": 153.69799999999998, "r_x2": 421.588, "r_y2": 148.99400000000003, "r_x3": 322.306, "r_y3": 148.99400000000003, "coord_origin": "TOPLEFT"}, "text": "<TD> 1 </TD><TD colspan=\"2\"> 2 </TD>", "orig": "<TD> 1 </TD><TD colspan=\"2\"> 2 </TD>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 322.306, "r_y0": 160.83799999999997, "r_x1": 349.23, "r_y1": 160.83799999999997, "r_x2": 349.23, "r_y2": 156.13400000000001, "r_x3": 322.306, "r_y3": 156.13400000000001, "coord_origin": "TOPLEFT"}, "text": "</TR><TR>", "orig": "</TR><TR>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 322.306, "r_y0": 167.97799999999995, "r_x1": 374.737, "r_y1": 167.97799999999995, "r_x2": 374.737, "r_y2": 163.274, "r_x3": 322.306, "r_y3": 163.274, "coord_origin": "TOPLEFT"}, "text": "<TD> 3 </TD><TD>...", "orig": "<TD> 3 </TD><TD>...", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 322.306, "r_y0": 175.11800000000005, "r_x1": 326.557, "r_y1": 175.11800000000005, "r_x2": 326.557, "r_y2": 170.414, "r_x3": 322.306, "r_y3": 170.414, "coord_origin": "TOPLEFT"}, "text": "...", "orig": "...", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 323.511, "r_y0": 95.38900000000001, "r_x1": 326.914, "r_y1": 95.38900000000001, "r_x2": 326.914, "r_y2": 89.74300000000005, "r_x3": 323.511, "r_y3": 89.74300000000005, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 48, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 323.715, "r_y0": 103.50800000000004, "r_x1": 327.118, "r_y1": 103.50800000000004, "r_x2": 327.118, "r_y2": 97.86199999999997, "r_x3": 323.715, "r_y3": 97.86199999999997, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 49, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 323.715, "r_y0": 111.70899999999995, "r_x1": 327.118, "r_y1": 111.70899999999995, "r_x2": 327.118, "r_y2": 106.06299999999999, "r_x3": 323.715, "r_y3": 106.06299999999999, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 50, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 454.464, "r_y0": 110.26499999999999, "r_x1": 457.867, "r_y1": 110.26499999999999, "r_x2": 457.867, "r_y2": 104.61900000000003, "r_x3": 454.464, "r_y3": 104.61900000000003, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 51, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 493.326, "r_y0": 96.81500000000005, "r_x1": 496.729, "r_y1": 96.81500000000005, "r_x2": 496.729, "r_y2": 91.16899999999998, "r_x3": 493.326, "r_y3": 91.16899999999998, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 52, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 454.083, "r_y0": 96.28800000000001, "r_x1": 457.486, "r_y1": 96.28800000000001, "r_x2": 457.486, "r_y2": 90.64200000000005, "r_x3": 454.083, "r_y3": 90.64200000000005, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": [{"id": 11, "label": "text", "bbox": {"l": 81.688, "t": 122.481, "r": 84.524, "b": 125.61699999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 0, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 81.688, "r_y0": 125.61699999999996, "r_x1": 84.524, "r_y1": 125.61699999999996, "r_x2": 84.524, "r_y2": 122.481, "r_x3": 81.688, "r_y3": 122.481, "coord_origin": "TOPLEFT"}, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 12, "label": "text", "bbox": {"l": 86.413, "t": 122.481, "r": 93.026, "b": 125.61699999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 86.413, "r_y0": 125.61699999999996, "r_x1": 93.026, "r_y1": 125.61699999999996, "r_x2": 93.026, "r_y2": 122.481, "r_x3": 86.413, "r_y3": 122.481, "coord_origin": "TOPLEFT"}, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 13, "label": "text", "bbox": {"l": 102.505, "t": 115.293, "r": 115.346, "b": 118.42999999999995, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 102.505, "r_y0": 118.42999999999995, "r_x1": 115.346, "r_y1": 118.42999999999995, "r_x2": 115.346, "r_y2": 115.293, "r_x3": 102.505, "r_y3": 115.293, "coord_origin": "TOPLEFT"}, "text": "Amount", "orig": "Amount", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 14, "label": "text", "bbox": {"l": 82.14, "t": 115.25599999999997, "r": 93.292, "b": 118.39200000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 82.14, "r_y0": 118.39200000000005, "r_x1": 93.292, "r_y1": 118.39200000000005, "r_x2": 93.292, "r_y2": 115.25599999999997, "r_x3": 82.14, "r_y3": 115.25599999999997, "coord_origin": "TOPLEFT"}, "text": "Names", "orig": "Names", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 15, "label": "text", "bbox": {"l": 96.748, "t": 122.481, "r": 104.312, "b": 125.61699999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 96.748, "r_y0": 125.61699999999996, "r_x1": 104.312, "r_y1": 125.61699999999996, "r_x2": 104.312, "r_y2": 122.481, "r_x3": 96.748, "r_y3": 122.481, "coord_origin": "TOPLEFT"}, "text": "1000", "orig": "1000", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 16, "label": "text", "bbox": {"l": 96.748, "t": 127.78499999999997, "r": 102.421, "b": 130.92100000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 96.748, "r_y0": 130.92100000000005, "r_x1": 102.421, "r_y1": 130.92100000000005, "r_x2": 102.421, "r_y2": 127.78499999999997, "r_x3": 96.748, "r_y3": 127.78499999999997, "coord_origin": "TOPLEFT"}, "text": "500", "orig": "500", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 17, "label": "text", "bbox": {"l": 96.748, "t": 133.49699999999996, "r": 104.312, "b": 136.63300000000004, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 96.748, "r_y0": 136.63300000000004, "r_x1": 104.312, "r_y1": 136.63300000000004, "r_x2": 104.312, "r_y2": 133.49699999999996, "r_x3": 96.748, "r_y3": 133.49699999999996, "coord_origin": "TOPLEFT"}, "text": "3500", "orig": "3500", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 18, "label": "text", "bbox": {"l": 96.748, "t": 139.20899999999995, "r": 102.421, "b": 142.34500000000003, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 96.748, "r_y0": 142.34500000000003, "r_x1": 102.421, "r_y1": 142.34500000000003, "r_x2": 102.421, "r_y2": 139.20899999999995, "r_x3": 96.748, "r_y3": 139.20899999999995, "coord_origin": "TOPLEFT"}, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 19, "label": "text", "bbox": {"l": 110.661, "t": 122.481, "r": 116.144, "b": 125.61699999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 110.661, "r_y0": 125.61699999999996, "r_x1": 116.144, "r_y1": 125.61699999999996, "r_x2": 116.144, "r_y2": 122.481, "r_x3": 110.661, "r_y3": 122.481, "coord_origin": "TOPLEFT"}, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 20, "label": "text", "bbox": {"l": 110.661, "t": 127.78499999999997, "r": 116.144, "b": 130.92100000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 110.661, "r_y0": 130.92100000000005, "r_x1": 116.144, "r_y1": 130.92100000000005, "r_x2": 116.144, "r_y2": 127.78499999999997, "r_x3": 110.661, "r_y3": 127.78499999999997, "coord_origin": "TOPLEFT"}, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 21, "label": "text", "bbox": {"l": 110.661, "t": 133.49699999999996, "r": 116.144, "b": 136.63300000000004, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 110.661, "r_y0": 136.63300000000004, "r_x1": 116.144, "r_y1": 136.63300000000004, "r_x2": 116.144, "r_y2": 133.49699999999996, "r_x3": 110.661, "r_y3": 133.49699999999996, "coord_origin": "TOPLEFT"}, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 22, "label": "text", "bbox": {"l": 110.661, "t": 139.20899999999995, "r": 116.144, "b": 142.34500000000003, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 110.661, "r_y0": 142.34500000000003, "r_x1": 116.144, "r_y1": 142.34500000000003, "r_x2": 116.144, "r_y2": 139.20899999999995, "r_x3": 110.661, "r_y3": 139.20899999999995, "coord_origin": "TOPLEFT"}, "text": "unit", "orig": "unit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 23, "label": "text", "bbox": {"l": 81.688, "t": 127.78499999999997, "r": 84.524, "b": 130.92100000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 81.688, "r_y0": 130.92100000000005, "r_x1": 84.524, "r_y1": 130.92100000000005, "r_x2": 84.524, "r_y2": 127.78499999999997, "r_x3": 81.688, "r_y3": 127.78499999999997, "coord_origin": "TOPLEFT"}, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 24, "label": "text", "bbox": {"l": 86.413, "t": 127.78499999999997, "r": 93.026, "b": 130.92100000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 86.413, "r_y0": 130.92100000000005, "r_x1": 93.026, "r_y1": 130.92100000000005, "r_x2": 93.026, "r_y2": 127.78499999999997, "r_x3": 86.413, "r_y3": 127.78499999999997, "coord_origin": "TOPLEFT"}, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 25, "label": "text", "bbox": {"l": 81.688, "t": 133.49699999999996, "r": 84.524, "b": 136.63300000000004, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 81.688, "r_y0": 136.63300000000004, "r_x1": 84.524, "r_y1": 136.63300000000004, "r_x2": 84.524, "r_y2": 133.49699999999996, "r_x3": 81.688, "r_y3": 133.49699999999996, "coord_origin": "TOPLEFT"}, "text": "3.", "orig": "3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 26, "label": "text", "bbox": {"l": 86.413, "t": 133.49699999999996, "r": 93.026, "b": 136.63300000000004, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 86.413, "r_y0": 136.63300000000004, "r_x1": 93.026, "r_y1": 136.63300000000004, "r_x2": 93.026, "r_y2": 133.49699999999996, "r_x3": 86.413, "r_y3": 133.49699999999996, "coord_origin": "TOPLEFT"}, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 27, "label": "text", "bbox": {"l": 81.688, "t": 139.20899999999995, "r": 84.524, "b": 142.34500000000003, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 81.688, "r_y0": 142.34500000000003, "r_x1": 84.524, "r_y1": 142.34500000000003, "r_x2": 84.524, "r_y2": 139.20899999999995, "r_x3": 81.688, "r_y3": 139.20899999999995, "coord_origin": "TOPLEFT"}, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 28, "label": "text", "bbox": {"l": 86.413, "t": 139.20899999999995, "r": 93.026, "b": 142.34500000000003, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 86.413, "r_y0": 142.34500000000003, "r_x1": 93.026, "r_y1": 142.34500000000003, "r_x2": 93.026, "r_y2": 139.20899999999995, "r_x3": 86.413, "r_y3": 139.20899999999995, "coord_origin": "TOPLEFT"}, "text": "Item", "orig": "Item", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 29, "label": "text", "bbox": {"l": 88.084, "t": 90.57100000000003, "r": 113.936, "b": 96.21699999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 88.084, "r_y0": 96.21699999999998, "r_x1": 113.936, "r_y1": 96.21699999999998, "r_x2": 113.936, "r_y2": 90.57100000000003, "r_x3": 88.084, "r_y3": 90.57100000000003, "coord_origin": "TOPLEFT"}, "text": "Extracted", "orig": "Extracted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 30, "label": "text", "bbox": {"l": 82.81, "t": 97.71100000000001, "r": 119.212, "b": 103.35699999999997, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 19, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 82.81, "r_y0": 103.35699999999997, "r_x1": 119.212, "r_y1": 103.35699999999997, "r_x2": 119.212, "r_y2": 97.71100000000001, "r_x3": 82.81, "r_y3": 97.71100000000001, "coord_origin": "TOPLEFT"}, "text": "Table Images", "orig": "Table Images", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 31, "label": "text", "bbox": {"l": 143.942, "t": 100.67600000000004, "r": 180.011, "b": 106.322, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 20, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 143.942, "r_y0": 106.322, "r_x1": 180.011, "r_y1": 106.322, "r_x2": 180.011, "r_y2": 100.67600000000004, "r_x3": 143.942, "r_y3": 100.67600000000004, "coord_origin": "TOPLEFT"}, "text": "Standardized", "orig": "Standardized", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 32, "label": "text", "bbox": {"l": 151.941, "t": 107.81600000000003, "r": 172.012, "b": 113.46199999999999, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 21, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.941, "r_y0": 113.46199999999999, "r_x1": 172.012, "r_y1": 113.46199999999999, "r_x2": 172.012, "r_y2": 107.81600000000003, "r_x3": 151.941, "r_y3": 107.81600000000003, "coord_origin": "TOPLEFT"}, "text": "Images", "orig": "Images", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 33, "label": "text", "bbox": {"l": 251.769, "t": 81.00400000000002, "r": 266.396, "b": 86.64999999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 22, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 251.769, "r_y0": 86.64999999999998, "r_x1": 266.396, "r_y1": 86.64999999999998, "r_x2": 266.396, "r_y2": 81.00400000000002, "r_x3": 251.769, "r_y3": 81.00400000000002, "coord_origin": "TOPLEFT"}, "text": "BBox", "orig": "BBox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 34, "label": "text", "bbox": {"l": 247.516, "t": 86.10400000000004, "r": 270.65, "b": 91.75, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 23, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 247.516, "r_y0": 91.75, "r_x1": 270.65, "r_y1": 91.75, "r_x2": 270.65, "r_y2": 86.10400000000004, "r_x3": 247.516, "r_y3": 86.10400000000004, "coord_origin": "TOPLEFT"}, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 35, "label": "text", "bbox": {"l": 331.037, "t": 78.63300000000004, "r": 352.126, "b": 84.279, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 24, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 331.037, "r_y0": 84.279, "r_x1": 352.126, "r_y1": 84.279, "r_x2": 352.126, "r_y2": 78.63300000000004, "r_x3": 331.037, "r_y3": 78.63300000000004, "coord_origin": "TOPLEFT"}, "text": "BBoxes", "orig": "BBoxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 36, "label": "text", "bbox": {"l": 390.564, "t": 96.106, "r": 431.726, "b": 101.75199999999995, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 25, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 390.564, "r_y0": 101.75199999999995, "r_x1": 431.726, "r_y1": 101.75199999999995, "r_x2": 431.726, "r_y2": 96.106, "r_x3": 390.564, "r_y3": 96.106, "coord_origin": "TOPLEFT"}, "text": "BBoxes can be", "orig": "BBoxes can be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 37, "label": "text", "bbox": {"l": 386.824, "t": 102.226, "r": 435.47, "b": 107.87199999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 26, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 386.824, "r_y0": 107.87199999999996, "r_x1": 435.47, "r_y1": 107.87199999999996, "r_x2": 435.47, "r_y2": 102.226, "r_x3": 386.824, "r_y3": 102.226, "coord_origin": "TOPLEFT"}, "text": "traced back to the", "orig": "traced back to the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 38, "label": "text", "bbox": {"l": 388.696, "t": 108.346, "r": 433.603, "b": 113.99199999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 27, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 388.696, "r_y0": 113.99199999999996, "r_x1": 433.603, "r_y1": 113.99199999999996, "r_x2": 433.603, "r_y2": 108.346, "r_x3": 388.696, "r_y3": 108.346, "coord_origin": "TOPLEFT"}, "text": "original image to", "orig": "original image to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 39, "label": "text", "bbox": {"l": 391.078, "t": 114.46600000000001, "r": 431.225, "b": 120.11199999999997, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 28, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 391.078, "r_y0": 120.11199999999997, "r_x1": 431.225, "r_y1": 120.11199999999997, "r_x2": 431.225, "r_y2": 114.46600000000001, "r_x3": 391.078, "r_y3": 114.46600000000001, "coord_origin": "TOPLEFT"}, "text": "extract content", "orig": "extract content", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 40, "label": "text", "bbox": {"l": 431.227, "t": 151.75900000000001, "r": 498.821, "b": 157.40499999999997, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 29, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 431.227, "r_y0": 157.40499999999997, "r_x1": 498.821, "r_y1": 157.40499999999997, "r_x2": 498.821, "r_y2": 151.75900000000001, "r_x3": 431.227, "r_y3": 151.75900000000001, "coord_origin": "TOPLEFT"}, "text": "Structure Tags sequence", "orig": "Structure Tags sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 41, "label": "text", "bbox": {"l": 431.174, "t": 157.87900000000002, "r": 498.878, "b": 163.52499999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 30, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 431.174, "r_y0": 163.52499999999998, "r_x1": 498.878, "r_y1": 163.52499999999998, "r_x2": 498.878, "r_y2": 157.87900000000002, "r_x3": 431.174, "r_y3": 157.87900000000002, "coord_origin": "TOPLEFT"}, "text": "provide full description of", "orig": "provide full description of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 42, "label": "text", "bbox": {"l": 440.529, "t": 163.99900000000002, "r": 489.518, "b": 169.64499999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 440.529, "r_y0": 169.64499999999998, "r_x1": 489.518, "r_y1": 169.64499999999998, "r_x2": 489.518, "r_y2": 163.99900000000002, "r_x3": 440.529, "r_y3": 163.99900000000002, "coord_origin": "TOPLEFT"}, "text": "the table structure", "orig": "the table structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 43, "label": "text", "bbox": {"l": 328.375, "t": 178.327, "r": 367.723, "b": 183.97299999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.375, "r_y0": 183.97299999999996, "r_x1": 367.723, "r_y1": 183.97299999999996, "r_x2": 367.723, "r_y2": 178.327, "r_x3": 328.375, "r_y3": 178.327, "coord_origin": "TOPLEFT"}, "text": "Structure Tags", "orig": "Structure Tags", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 44, "label": "text", "bbox": {"l": 331.845, "t": 123.98199999999997, "r": 373.68, "b": 129.62800000000004, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 331.845, "r_y0": 129.62800000000004, "r_x1": 373.68, "r_y1": 129.62800000000004, "r_x2": 373.68, "r_y2": 123.98199999999997, "r_x3": 331.845, "r_y3": 123.98199999999997, "coord_origin": "TOPLEFT"}, "text": "BBoxes in sync", "orig": "BBoxes in sync", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 45, "label": "text", "bbox": {"l": 331.845, "t": 129.082, "r": 381.178, "b": 134.72799999999995, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 331.845, "r_y0": 134.72799999999995, "r_x1": 381.178, "r_y1": 134.72799999999995, "r_x2": 381.178, "r_y2": 129.082, "r_x3": 331.845, "r_y3": 129.082, "coord_origin": "TOPLEFT"}, "text": "with tag sequence", "orig": "with tag sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 46, "label": "text", "bbox": {"l": 196.626, "t": 88.19000000000005, "r": 219.423, "b": 93.83600000000001, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 196.626, "r_y0": 93.83600000000001, "r_x1": 219.423, "r_y1": 93.83600000000001, "r_x2": 219.423, "r_y2": 88.19000000000005, "r_x3": 196.626, "r_y3": 88.19000000000005, "coord_origin": "TOPLEFT"}, "text": "Encoder", "orig": "Encoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 47, "label": "text", "bbox": {"l": 246.668, "t": 129.56799999999998, "r": 271.499, "b": 135.21400000000006, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 246.668, "r_y0": 135.21400000000006, "r_x1": 271.499, "r_y1": 135.21400000000006, "r_x2": 271.499, "r_y2": 129.56799999999998, "r_x3": 246.668, "r_y3": 129.56799999999998, "coord_origin": "TOPLEFT"}, "text": "Structure", "orig": "Structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 48, "label": "text", "bbox": {"l": 247.516, "t": 134.668, "r": 270.65, "b": 140.31399999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 247.516, "r_y0": 140.31399999999996, "r_x1": 270.65, "r_y1": 140.31399999999996, "r_x2": 270.65, "r_y2": 134.668, "r_x3": 247.516, "r_y3": 134.668, "coord_origin": "TOPLEFT"}, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 49, "label": "text", "bbox": {"l": 330.631, "t": 89.09299999999996, "r": 365.553, "b": 94.73900000000003, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 330.631, "r_y0": 94.73900000000003, "r_x1": 365.553, "r_y1": 94.73900000000003, "r_x2": 365.553, "r_y2": 89.09299999999996, "r_x3": 330.631, "r_y3": 89.09299999999996, "coord_origin": "TOPLEFT"}, "text": "[x1, y2, x2, y2]", "orig": "[x1, y2, x2, y2]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 50, "label": "text", "bbox": {"l": 330.631, "t": 97.25300000000004, "r": 370.227, "b": 102.899, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 330.631, "r_y0": 102.899, "r_x1": 370.227, "r_y1": 102.899, "r_x2": 370.227, "r_y2": 97.25300000000004, "r_x3": 330.631, "r_y3": 97.25300000000004, "coord_origin": "TOPLEFT"}, "text": "[x1', y2', x2', y2']", "orig": "[x1', y2', x2', y2']", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 51, "label": "text", "bbox": {"l": 330.631, "t": 105.41300000000001, "r": 374.512, "b": 111.05899999999997, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 330.631, "r_y0": 111.05899999999997, "r_x1": 374.512, "r_y1": 111.05899999999997, "r_x2": 374.512, "r_y2": 105.41300000000001, "r_x3": 330.631, "r_y3": 105.41300000000001, "coord_origin": "TOPLEFT"}, "text": "[x1'', y2'', x2'', y2'']", "orig": "[x1'', y2'', x2'', y2'']", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 52, "label": "text", "bbox": {"l": 330.631, "t": 113.57299999999998, "r": 335.732, "b": 119.21900000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 330.631, "r_y0": 119.21900000000005, "r_x1": 335.732, "r_y1": 119.21900000000005, "r_x2": 335.732, "r_y2": 113.57299999999998, "r_x3": 330.631, "r_y3": 113.57299999999998, "coord_origin": "TOPLEFT"}, "text": "...", "orig": "...", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 53, "label": "text", "bbox": {"l": 322.306, "t": 141.85400000000004, "r": 335.06, "b": 146.558, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 322.306, "r_y0": 146.558, "r_x1": 335.06, "r_y1": 146.558, "r_x2": 335.06, "r_y2": 141.85400000000004, "r_x3": 322.306, "r_y3": 141.85400000000004, "coord_origin": "TOPLEFT"}, "text": "<TR>", "orig": "<TR>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 54, "label": "text", "bbox": {"l": 322.306, "t": 148.99400000000003, "r": 421.588, "b": 153.69799999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 322.306, "r_y0": 153.69799999999998, "r_x1": 421.588, "r_y1": 153.69799999999998, "r_x2": 421.588, "r_y2": 148.99400000000003, "r_x3": 322.306, "r_y3": 148.99400000000003, "coord_origin": "TOPLEFT"}, "text": "<TD> 1 </TD><TD colspan=\"2\"> 2 </TD>", "orig": "<TD> 1 </TD><TD colspan=\"2\"> 2 </TD>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 55, "label": "text", "bbox": {"l": 322.306, "t": 156.13400000000001, "r": 349.23, "b": 160.83799999999997, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 322.306, "r_y0": 160.83799999999997, "r_x1": 349.23, "r_y1": 160.83799999999997, "r_x2": 349.23, "r_y2": 156.13400000000001, "r_x3": 322.306, "r_y3": 156.13400000000001, "coord_origin": "TOPLEFT"}, "text": "</TR><TR>", "orig": "</TR><TR>", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 56, "label": "text", "bbox": {"l": 322.306, "t": 163.274, "r": 374.737, "b": 167.97799999999995, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 322.306, "r_y0": 167.97799999999995, "r_x1": 374.737, "r_y1": 167.97799999999995, "r_x2": 374.737, "r_y2": 163.274, "r_x3": 322.306, "r_y3": 163.274, "coord_origin": "TOPLEFT"}, "text": "<TD> 3 </TD><TD>...", "orig": "<TD> 3 </TD><TD>...", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 57, "label": "text", "bbox": {"l": 322.306, "t": 170.414, "r": 326.557, "b": 175.11800000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 322.306, "r_y0": 175.11800000000005, "r_x1": 326.557, "r_y1": 175.11800000000005, "r_x2": 326.557, "r_y2": 170.414, "r_x3": 322.306, "r_y3": 170.414, "coord_origin": "TOPLEFT"}, "text": "...", "orig": "...", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 58, "label": "text", "bbox": {"l": 323.511, "t": 89.74300000000005, "r": 326.914, "b": 95.38900000000001, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 323.511, "r_y0": 95.38900000000001, "r_x1": 326.914, "r_y1": 95.38900000000001, "r_x2": 326.914, "r_y2": 89.74300000000005, "r_x3": 323.511, "r_y3": 89.74300000000005, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 59, "label": "text", "bbox": {"l": 323.715, "t": 97.86199999999997, "r": 327.118, "b": 103.50800000000004, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 48, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 323.715, "r_y0": 103.50800000000004, "r_x1": 327.118, "r_y1": 103.50800000000004, "r_x2": 327.118, "r_y2": 97.86199999999997, "r_x3": 323.715, "r_y3": 97.86199999999997, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 60, "label": "text", "bbox": {"l": 323.715, "t": 106.06299999999999, "r": 327.118, "b": 111.70899999999995, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 49, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 323.715, "r_y0": 111.70899999999995, "r_x1": 327.118, "r_y1": 111.70899999999995, "r_x2": 327.118, "r_y2": 106.06299999999999, "r_x3": 323.715, "r_y3": 106.06299999999999, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 61, "label": "text", "bbox": {"l": 454.464, "t": 104.61900000000003, "r": 457.867, "b": 110.26499999999999, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 50, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 454.464, "r_y0": 110.26499999999999, "r_x1": 457.867, "r_y1": 110.26499999999999, "r_x2": 457.867, "r_y2": 104.61900000000003, "r_x3": 454.464, "r_y3": 104.61900000000003, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 62, "label": "text", "bbox": {"l": 493.326, "t": 91.16899999999998, "r": 496.729, "b": 96.81500000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 51, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 493.326, "r_y0": 96.81500000000005, "r_x1": 496.729, "r_y1": 96.81500000000005, "r_x2": 496.729, "r_y2": 91.16899999999998, "r_x3": 493.326, "r_y3": 91.16899999999998, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 63, "label": "text", "bbox": {"l": 454.083, "t": 90.64200000000005, "r": 457.486, "b": 96.28800000000001, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 52, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 454.083, "r_y0": 96.28800000000001, "r_x1": 457.486, "r_y1": 96.28800000000001, "r_x2": 457.486, "r_y2": 90.64200000000005, "r_x3": 454.083, "r_y3": 90.64200000000005, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}]}, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null}, {"label": "caption", "id": 6, "page_no": 4, "cluster": {"id": 6, "label": "caption", "bbox": {"l": 50.112, "t": 203.986, "r": 545.108, "b": 224.88099999999997, "coord_origin": "TOPLEFT"}, "confidence": 0.9677652716636658, "cells": [{"index": 53, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 212.92600000000004, "r_x1": 86.884, "r_y1": 212.92600000000004, "r_x2": 86.884, "r_y2": 204.37400000000002, "r_x3": 50.112, "r_y3": 204.37400000000002, "coord_origin": "TOPLEFT"}, "text": "Figure 3:", "orig": "Figure 3:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 54, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 94.021, "r_y0": 212.942, "r_x1": 149.851, "r_y1": 212.942, "r_x2": 149.851, "r_y2": 203.986, "r_x3": 94.021, "r_y3": 203.986, "coord_origin": "TOPLEFT"}, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 55, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 152.861, "r_y0": 212.92600000000004, "r_x1": 545.108, "r_y1": 212.92600000000004, "r_x2": 545.108, "r_y2": 204.37400000000002, "r_x3": 152.861, "r_y3": 204.37400000000002, "coord_origin": "TOPLEFT"}, "text": "takes in an image of the PDF and creates bounding box and HTML structure predictions that are", "orig": "takes in an image of the PDF and creates bounding box and HTML structure predictions that are", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 56, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 224.88099999999997, "r_x1": 436.013, "r_y1": 224.88099999999997, "r_x2": 436.013, "r_y2": 216.32899999999995, "r_x3": 50.112, "r_y3": 216.32899999999995, "coord_origin": "TOPLEFT"}, "text": "synchronized. The bounding boxes grabs the content from the PDF and inserts it in the structure.", "orig": "synchronized. The bounding boxes grabs the content from the PDF and inserts it in the structure.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Figure 3: TableFormer takes in an image of the PDF and creates bounding box and HTML structure predictions that are synchronized. The bounding boxes grabs the content from the PDF and inserts it in the structure."}, {"label": "picture", "id": 5, "page_no": 4, "cluster": {"id": 5, "label": "picture", "bbox": {"l": 53.03328323364258, "t": 257.66534423828125, "r": 285.3731689453125, "b": 507.6688537597656, "coord_origin": "TOPLEFT"}, "confidence": 0.9724942445755005, "cells": [{"index": 57, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 74.253, "r_y0": 263.884, "r_x1": 101.758, "r_y1": 263.884, "r_x2": 101.758, "r_y2": 259.52, "r_x3": 74.253, "r_y3": 259.52, "coord_origin": "TOPLEFT"}, "text": "Input Image", "orig": "Input Image", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 58, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 122.3, "r_y0": 264.015, "r_x1": 157.84, "r_y1": 264.015, "r_x2": 157.84, "r_y2": 259.65, "r_x3": 122.3, "r_y3": 259.65, "coord_origin": "TOPLEFT"}, "text": "Tokenised Tags", "orig": "Tokenised Tags", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 59, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 78.549, "r_y0": 376.78, "r_x1": 125.684, "r_y1": 376.78, "r_x2": 125.684, "r_y2": 372.588, "r_x3": 78.549, "r_y3": 372.588, "coord_origin": "TOPLEFT"}, "text": "Multi-Head Attention", "orig": "Multi-Head Attention", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 60, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 78.513, "r_y0": 396.713, "r_x1": 125.111, "r_y1": 396.713, "r_x2": 125.111, "r_y2": 392.52, "r_x3": 78.513, "r_y3": 392.52, "coord_origin": "TOPLEFT"}, "text": "Add & Normalisation", "orig": "Add & Normalisation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 61, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 76.025, "r_y0": 429.848, "r_x1": 127.923, "r_y1": 429.848, "r_x2": 127.923, "r_y2": 425.655, "r_x3": 76.025, "r_y3": 425.655, "coord_origin": "TOPLEFT"}, "text": "Feed Forward Network", "orig": "Feed Forward Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 62, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 78.383, "r_y0": 450.284, "r_x1": 124.98, "r_y1": 450.284, "r_x2": 124.98, "r_y2": 446.091, "r_x3": 78.383, "r_y3": 446.091, "coord_origin": "TOPLEFT"}, "text": "Add & Normalisation", "orig": "Add & Normalisation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 63, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 167.469, "r_y0": 467.838, "r_x1": 181.629, "r_y1": 467.838, "r_x2": 181.629, "r_y2": 463.645, "r_x3": 167.469, "r_y3": 463.645, "coord_origin": "TOPLEFT"}, "text": "Linear", "orig": "Linear", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 64, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 165.613, "r_y0": 483.866, "r_x1": 184.432, "r_y1": 483.866, "r_x2": 184.432, "r_y2": 479.673, "r_x3": 165.613, "r_y3": 479.673, "coord_origin": "TOPLEFT"}, "text": "Softmax", "orig": "Softmax", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 65, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 65.32, "r_y0": 329.941, "r_x1": 132.925, "r_y1": 329.941, "r_x2": 132.925, "r_y2": 325.527, "r_x3": 65.32, "r_y3": 325.527, "coord_origin": "TOPLEFT"}, "text": "CNN BACKBONE ENCODER", "orig": "CNN BACKBONE ENCODER", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 66, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 119.515, "r_y0": 274.491, "r_x1": 126.837, "r_y1": 274.491, "r_x2": 126.837, "r_y2": 270.73900000000003, "r_x3": 119.515, "r_y3": 270.73900000000003, "coord_origin": "TOPLEFT"}, "text": "[30,", "orig": "[30,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 67, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 129.2, "r_y0": 274.491, "r_x1": 132.745, "r_y1": 274.491, "r_x2": 132.745, "r_y2": 270.73900000000003, "r_x3": 129.2, "r_y3": 270.73900000000003, "coord_origin": "TOPLEFT"}, "text": "1,", "orig": "1,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 68, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 135.108, "r_y0": 274.491, "r_x1": 138.652, "r_y1": 274.491, "r_x2": 138.652, "r_y2": 270.73900000000003, "r_x3": 135.108, "r_y3": 270.73900000000003, "coord_origin": "TOPLEFT"}, "text": "2,", "orig": "2,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 69, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 141.015, "r_y0": 274.491, "r_x1": 144.56, "r_y1": 274.491, "r_x2": 144.56, "r_y2": 270.73900000000003, "r_x3": 141.015, "r_y3": 270.73900000000003, "coord_origin": "TOPLEFT"}, "text": "3,", "orig": "3,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 70, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 146.923, "r_y0": 274.491, "r_x1": 160.625, "r_y1": 274.491, "r_x2": 160.625, "r_y2": 270.73900000000003, "r_x3": 146.923, "r_y3": 270.73900000000003, "coord_origin": "TOPLEFT"}, "text": "4, \u20263,", "orig": "4, \u20263,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 71, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 128.729, "r_y0": 279.741, "r_x1": 132.273, "r_y1": 279.741, "r_x2": 132.273, "r_y2": 275.98900000000003, "r_x3": 128.729, "r_y3": 275.98900000000003, "coord_origin": "TOPLEFT"}, "text": "4,", "orig": "4,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 72, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.636, "r_y0": 279.741, "r_x1": 138.181, "r_y1": 279.741, "r_x2": 138.181, "r_y2": 275.98900000000003, "r_x3": 134.636, "r_y3": 275.98900000000003, "coord_origin": "TOPLEFT"}, "text": "5,", "orig": "5,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 73, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 140.544, "r_y0": 279.741, "r_x1": 151.411, "r_y1": 279.741, "r_x2": 151.411, "r_y2": 275.98900000000003, "r_x3": 140.544, "r_y3": 275.98900000000003, "coord_origin": "TOPLEFT"}, "text": "8, 31]", "orig": "8, 31]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 74, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 60.434, "r_y0": 343.926, "r_x1": 79.019, "r_y1": 343.926, "r_x2": 79.019, "r_y2": 340.521, "r_x3": 60.434, "r_y3": 340.521, "coord_origin": "TOPLEFT"}, "text": "Positional", "orig": "Positional", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 75, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 60.598, "r_y0": 348.352, "r_x1": 78.855, "r_y1": 348.352, "r_x2": 78.855, "r_y2": 344.948, "r_x3": 60.598, "r_y3": 344.948, "coord_origin": "TOPLEFT"}, "text": "Encoding", "orig": "Encoding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 76, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.829, "r_y0": 298.344, "r_x1": 153.414, "r_y1": 298.344, "r_x2": 153.414, "r_y2": 294.939, "r_x3": 134.829, "r_y3": 294.939, "coord_origin": "TOPLEFT"}, "text": "Positional", "orig": "Positional", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 77, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.993, "r_y0": 302.77, "r_x1": 153.25, "r_y1": 302.77, "r_x2": 153.25, "r_y2": 299.365, "r_x3": 134.993, "r_y3": 299.365, "coord_origin": "TOPLEFT"}, "text": "Encoding", "orig": "Encoding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 78, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 150.552, "r_y0": 350.753, "r_x1": 197.149, "r_y1": 350.753, "r_x2": 197.149, "r_y2": 346.56, "r_x3": 150.552, "r_y3": 346.56, "coord_origin": "TOPLEFT"}, "text": "Add & Normalisation", "orig": "Add & Normalisation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 79, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 150.552, "r_y0": 399.818, "r_x1": 197.149, "r_y1": 399.818, "r_x2": 197.149, "r_y2": 395.625, "r_x3": 150.552, "r_y3": 395.625, "coord_origin": "TOPLEFT"}, "text": "Add & Normalisation", "orig": "Add & Normalisation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 80, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 150.185, "r_y0": 381.063, "r_x1": 197.32, "r_y1": 381.063, "r_x2": 197.32, "r_y2": 376.87, "r_x3": 150.185, "r_y3": 376.87, "coord_origin": "TOPLEFT"}, "text": "Multi-Head Attention", "orig": "Multi-Head Attention", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 81, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 150.552, "r_y0": 445.643, "r_x1": 197.149, "r_y1": 445.643, "r_x2": 197.149, "r_y2": 441.45, "r_x3": 150.552, "r_y3": 441.45, "coord_origin": "TOPLEFT"}, "text": "Add & Normalisation", "orig": "Add & Normalisation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 82, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 147.864, "r_y0": 427.488, "r_x1": 199.762, "r_y1": 427.488, "r_x2": 199.762, "r_y2": 423.295, "r_x3": 147.864, "r_y3": 423.295, "coord_origin": "TOPLEFT"}, "text": "Feed Forward Network", "orig": "Feed Forward Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 83, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 241.566, "r_y0": 319.657, "r_x1": 255.725, "r_y1": 319.657, "r_x2": 255.725, "r_y2": 315.465, "r_x3": 241.566, "r_y3": 315.465, "coord_origin": "TOPLEFT"}, "text": "Linear", "orig": "Linear", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 84, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 241.917, "r_y0": 366.759, "r_x1": 256.077, "r_y1": 366.759, "r_x2": 256.077, "r_y2": 362.567, "r_x3": 241.917, "r_y3": 362.567, "coord_origin": "TOPLEFT"}, "text": "Linear", "orig": "Linear", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 85, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 228.054, "r_y0": 342.014, "r_x1": 269.393, "r_y1": 342.014, "r_x2": 269.393, "r_y2": 337.821, "r_x3": 228.054, "r_y3": 337.821, "coord_origin": "TOPLEFT"}, "text": "Attention Network", "orig": "Attention Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 86, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 228.446, "r_y0": 410.541, "r_x1": 238.739, "r_y1": 410.541, "r_x2": 238.739, "r_y2": 406.349, "r_x3": 228.446, "r_y3": 406.349, "coord_origin": "TOPLEFT"}, "text": "MLP", "orig": "MLP", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 87, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 256.298, "r_y0": 410.598, "r_x1": 270.457, "r_y1": 410.598, "r_x2": 270.457, "r_y2": 406.405, "r_x3": 256.298, "r_y3": 406.405, "coord_origin": "TOPLEFT"}, "text": "Linear", "orig": "Linear", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 88, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 239.545, "r_y0": 387.608, "r_x1": 258.089, "r_y1": 387.608, "r_x2": 258.089, "r_y2": 383.415, "r_x3": 239.545, "r_y3": 383.415, "coord_origin": "TOPLEFT"}, "text": "Sigmoid", "orig": "Sigmoid", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 89, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 59.258, "r_y0": 449.783, "r_x1": 59.245, "r_y1": 384.871, "r_x2": 55.273, "r_y2": 384.872, "r_x3": 55.286, "r_y3": 449.784, "coord_origin": "TOPLEFT"}, "text": "Transformer Encoder Network", "orig": "Transformer Encoder Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 90, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 59.058, "r_y0": 378.454, "r_x1": 59.055, "r_y1": 373.809, "r_x2": 55.345, "r_y2": 373.812, "r_x3": 55.348, "r_y3": 378.457, "coord_origin": "TOPLEFT"}, "text": "x2", "orig": "x2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 91, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 85.296, "r_y0": 490.108, "r_x1": 122.166, "r_y1": 490.098, "r_x2": 122.165, "r_y2": 485.687, "r_x3": 85.295, "r_y3": 485.697, "coord_origin": "TOPLEFT"}, "text": "Encoded Output", "orig": "Encoded Output", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 92, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 229.666, "r_y0": 285.074, "r_x1": 265.321, "r_y1": 285.064, "r_x2": 265.32, "r_y2": 281.281, "r_x3": 229.665, "r_y3": 281.291, "coord_origin": "TOPLEFT"}, "text": "Encoded Output", "orig": "Encoded Output", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 93, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 157.174, "r_y0": 505.871, "r_x1": 190.419, "r_y1": 505.862, "r_x2": 190.417, "r_y2": 501.45, "r_x3": 157.172, "r_y3": 501.459, "coord_origin": "TOPLEFT"}, "text": "Predicted Tags", "orig": "Predicted Tags", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 94, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 227.816, "r_y0": 443.634, "r_x1": 269.396, "r_y1": 443.622, "r_x2": 269.395, "r_y2": 439.211, "r_x3": 227.815, "r_y3": 439.222, "coord_origin": "TOPLEFT"}, "text": "Bounding Boxes &", "orig": "Bounding Boxes &", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 95, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 233.703, "r_y0": 449.632, "r_x1": 263.513, "r_y1": 449.624, "r_x2": 263.511, "r_y2": 445.212, "r_x3": 233.701, "r_y3": 445.22, "coord_origin": "TOPLEFT"}, "text": "Classification", "orig": "Classification", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 96, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 184.747, "r_y0": 298.506, "r_x1": 210.91, "r_y1": 298.506, "r_x2": 210.91, "r_y2": 294.534, "r_x3": 184.747, "r_y3": 294.534, "coord_origin": "TOPLEFT"}, "text": "Transformer", "orig": "Transformer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 97, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 178.912, "r_y0": 304.256, "r_x1": 216.744, "r_y1": 304.256, "r_x2": 216.744, "r_y2": 300.284, "r_x3": 178.912, "r_y3": 300.284, "coord_origin": "TOPLEFT"}, "text": "Decoder Network", "orig": "Decoder Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 98, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 194.246, "r_y0": 287.601, "r_x1": 198.891, "r_y1": 287.601, "r_x2": 198.891, "r_y2": 283.891, "r_x3": 194.246, "r_y3": 283.891, "coord_origin": "TOPLEFT"}, "text": "x4", "orig": "x4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 99, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 221.456, "r_y0": 277.548, "r_x1": 276.471, "r_y1": 277.548, "r_x2": 276.471, "r_y2": 273.134, "r_x3": 221.456, "r_y3": 273.134, "coord_origin": "TOPLEFT"}, "text": "CELL BBOX DECODER", "orig": "CELL BBOX DECODER", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 100, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.652, "r_y0": 328.837, "r_x1": 195.97, "r_y1": 328.837, "r_x2": 195.97, "r_y2": 324.644, "r_x3": 151.652, "r_y3": 324.644, "coord_origin": "TOPLEFT"}, "text": "Masked Multi-Head", "orig": "Masked Multi-Head", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 101, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 163.433, "r_y0": 334.837, "r_x1": 184.19, "r_y1": 334.837, "r_x2": 184.19, "r_y2": 330.644, "r_x3": 163.433, "r_y3": 330.644, "coord_origin": "TOPLEFT"}, "text": "Attention", "orig": "Attention", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": [{"id": 64, "label": "text", "bbox": {"l": 74.253, "t": 259.52, "r": 101.758, "b": 263.884, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 57, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 74.253, "r_y0": 263.884, "r_x1": 101.758, "r_y1": 263.884, "r_x2": 101.758, "r_y2": 259.52, "r_x3": 74.253, "r_y3": 259.52, "coord_origin": "TOPLEFT"}, "text": "Input Image", "orig": "Input Image", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 65, "label": "text", "bbox": {"l": 122.3, "t": 259.65, "r": 157.84, "b": 264.015, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 58, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 122.3, "r_y0": 264.015, "r_x1": 157.84, "r_y1": 264.015, "r_x2": 157.84, "r_y2": 259.65, "r_x3": 122.3, "r_y3": 259.65, "coord_origin": "TOPLEFT"}, "text": "Tokenised Tags", "orig": "Tokenised Tags", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 66, "label": "text", "bbox": {"l": 78.549, "t": 372.588, "r": 125.684, "b": 376.78, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 59, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 78.549, "r_y0": 376.78, "r_x1": 125.684, "r_y1": 376.78, "r_x2": 125.684, "r_y2": 372.588, "r_x3": 78.549, "r_y3": 372.588, "coord_origin": "TOPLEFT"}, "text": "Multi-Head Attention", "orig": "Multi-Head Attention", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 67, "label": "text", "bbox": {"l": 78.513, "t": 392.52, "r": 125.111, "b": 396.713, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 60, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 78.513, "r_y0": 396.713, "r_x1": 125.111, "r_y1": 396.713, "r_x2": 125.111, "r_y2": 392.52, "r_x3": 78.513, "r_y3": 392.52, "coord_origin": "TOPLEFT"}, "text": "Add & Normalisation", "orig": "Add & Normalisation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 68, "label": "text", "bbox": {"l": 76.025, "t": 425.655, "r": 127.923, "b": 429.848, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 61, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 76.025, "r_y0": 429.848, "r_x1": 127.923, "r_y1": 429.848, "r_x2": 127.923, "r_y2": 425.655, "r_x3": 76.025, "r_y3": 425.655, "coord_origin": "TOPLEFT"}, "text": "Feed Forward Network", "orig": "Feed Forward Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 69, "label": "text", "bbox": {"l": 78.383, "t": 446.091, "r": 124.98, "b": 450.284, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 62, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 78.383, "r_y0": 450.284, "r_x1": 124.98, "r_y1": 450.284, "r_x2": 124.98, "r_y2": 446.091, "r_x3": 78.383, "r_y3": 446.091, "coord_origin": "TOPLEFT"}, "text": "Add & Normalisation", "orig": "Add & Normalisation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 70, "label": "text", "bbox": {"l": 167.469, "t": 463.645, "r": 181.629, "b": 467.838, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 63, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 167.469, "r_y0": 467.838, "r_x1": 181.629, "r_y1": 467.838, "r_x2": 181.629, "r_y2": 463.645, "r_x3": 167.469, "r_y3": 463.645, "coord_origin": "TOPLEFT"}, "text": "Linear", "orig": "Linear", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 71, "label": "text", "bbox": {"l": 165.613, "t": 479.673, "r": 184.432, "b": 483.866, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 64, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 165.613, "r_y0": 483.866, "r_x1": 184.432, "r_y1": 483.866, "r_x2": 184.432, "r_y2": 479.673, "r_x3": 165.613, "r_y3": 479.673, "coord_origin": "TOPLEFT"}, "text": "Softmax", "orig": "Softmax", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 72, "label": "text", "bbox": {"l": 65.32, "t": 325.527, "r": 132.925, "b": 329.941, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 65, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 65.32, "r_y0": 329.941, "r_x1": 132.925, "r_y1": 329.941, "r_x2": 132.925, "r_y2": 325.527, "r_x3": 65.32, "r_y3": 325.527, "coord_origin": "TOPLEFT"}, "text": "CNN BACKBONE ENCODER", "orig": "CNN BACKBONE ENCODER", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 73, "label": "text", "bbox": {"l": 119.515, "t": 270.73900000000003, "r": 126.837, "b": 274.491, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 66, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 119.515, "r_y0": 274.491, "r_x1": 126.837, "r_y1": 274.491, "r_x2": 126.837, "r_y2": 270.73900000000003, "r_x3": 119.515, "r_y3": 270.73900000000003, "coord_origin": "TOPLEFT"}, "text": "[30,", "orig": "[30,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 74, "label": "text", "bbox": {"l": 129.2, "t": 270.73900000000003, "r": 132.745, "b": 274.491, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 67, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 129.2, "r_y0": 274.491, "r_x1": 132.745, "r_y1": 274.491, "r_x2": 132.745, "r_y2": 270.73900000000003, "r_x3": 129.2, "r_y3": 270.73900000000003, "coord_origin": "TOPLEFT"}, "text": "1,", "orig": "1,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 75, "label": "text", "bbox": {"l": 135.108, "t": 270.73900000000003, "r": 138.652, "b": 274.491, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 68, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 135.108, "r_y0": 274.491, "r_x1": 138.652, "r_y1": 274.491, "r_x2": 138.652, "r_y2": 270.73900000000003, "r_x3": 135.108, "r_y3": 270.73900000000003, "coord_origin": "TOPLEFT"}, "text": "2,", "orig": "2,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 76, "label": "text", "bbox": {"l": 141.015, "t": 270.73900000000003, "r": 144.56, "b": 274.491, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 69, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 141.015, "r_y0": 274.491, "r_x1": 144.56, "r_y1": 274.491, "r_x2": 144.56, "r_y2": 270.73900000000003, "r_x3": 141.015, "r_y3": 270.73900000000003, "coord_origin": "TOPLEFT"}, "text": "3,", "orig": "3,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 77, "label": "text", "bbox": {"l": 146.923, "t": 270.73900000000003, "r": 160.625, "b": 274.491, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 70, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 146.923, "r_y0": 274.491, "r_x1": 160.625, "r_y1": 274.491, "r_x2": 160.625, "r_y2": 270.73900000000003, "r_x3": 146.923, "r_y3": 270.73900000000003, "coord_origin": "TOPLEFT"}, "text": "4, \u20263,", "orig": "4, \u20263,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 78, "label": "text", "bbox": {"l": 128.729, "t": 275.98900000000003, "r": 132.273, "b": 279.741, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 71, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 128.729, "r_y0": 279.741, "r_x1": 132.273, "r_y1": 279.741, "r_x2": 132.273, "r_y2": 275.98900000000003, "r_x3": 128.729, "r_y3": 275.98900000000003, "coord_origin": "TOPLEFT"}, "text": "4,", "orig": "4,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 79, "label": "text", "bbox": {"l": 134.636, "t": 275.98900000000003, "r": 138.181, "b": 279.741, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 72, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.636, "r_y0": 279.741, "r_x1": 138.181, "r_y1": 279.741, "r_x2": 138.181, "r_y2": 275.98900000000003, "r_x3": 134.636, "r_y3": 275.98900000000003, "coord_origin": "TOPLEFT"}, "text": "5,", "orig": "5,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 80, "label": "text", "bbox": {"l": 140.544, "t": 275.98900000000003, "r": 151.411, "b": 279.741, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 73, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 140.544, "r_y0": 279.741, "r_x1": 151.411, "r_y1": 279.741, "r_x2": 151.411, "r_y2": 275.98900000000003, "r_x3": 140.544, "r_y3": 275.98900000000003, "coord_origin": "TOPLEFT"}, "text": "8, 31]", "orig": "8, 31]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 81, "label": "text", "bbox": {"l": 60.434, "t": 340.521, "r": 79.019, "b": 343.926, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 74, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 60.434, "r_y0": 343.926, "r_x1": 79.019, "r_y1": 343.926, "r_x2": 79.019, "r_y2": 340.521, "r_x3": 60.434, "r_y3": 340.521, "coord_origin": "TOPLEFT"}, "text": "Positional", "orig": "Positional", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 82, "label": "text", "bbox": {"l": 60.598, "t": 344.948, "r": 78.855, "b": 348.352, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 75, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 60.598, "r_y0": 348.352, "r_x1": 78.855, "r_y1": 348.352, "r_x2": 78.855, "r_y2": 344.948, "r_x3": 60.598, "r_y3": 344.948, "coord_origin": "TOPLEFT"}, "text": "Encoding", "orig": "Encoding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 83, "label": "text", "bbox": {"l": 134.829, "t": 294.939, "r": 153.414, "b": 298.344, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 76, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.829, "r_y0": 298.344, "r_x1": 153.414, "r_y1": 298.344, "r_x2": 153.414, "r_y2": 294.939, "r_x3": 134.829, "r_y3": 294.939, "coord_origin": "TOPLEFT"}, "text": "Positional", "orig": "Positional", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 84, "label": "text", "bbox": {"l": 134.993, "t": 299.365, "r": 153.25, "b": 302.77, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 77, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.993, "r_y0": 302.77, "r_x1": 153.25, "r_y1": 302.77, "r_x2": 153.25, "r_y2": 299.365, "r_x3": 134.993, "r_y3": 299.365, "coord_origin": "TOPLEFT"}, "text": "Encoding", "orig": "Encoding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 85, "label": "text", "bbox": {"l": 150.552, "t": 346.56, "r": 197.149, "b": 350.753, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 78, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 150.552, "r_y0": 350.753, "r_x1": 197.149, "r_y1": 350.753, "r_x2": 197.149, "r_y2": 346.56, "r_x3": 150.552, "r_y3": 346.56, "coord_origin": "TOPLEFT"}, "text": "Add & Normalisation", "orig": "Add & Normalisation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 86, "label": "text", "bbox": {"l": 150.552, "t": 395.625, "r": 197.149, "b": 399.818, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 79, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 150.552, "r_y0": 399.818, "r_x1": 197.149, "r_y1": 399.818, "r_x2": 197.149, "r_y2": 395.625, "r_x3": 150.552, "r_y3": 395.625, "coord_origin": "TOPLEFT"}, "text": "Add & Normalisation", "orig": "Add & Normalisation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 87, "label": "text", "bbox": {"l": 150.185, "t": 376.87, "r": 197.32, "b": 381.063, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 80, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 150.185, "r_y0": 381.063, "r_x1": 197.32, "r_y1": 381.063, "r_x2": 197.32, "r_y2": 376.87, "r_x3": 150.185, "r_y3": 376.87, "coord_origin": "TOPLEFT"}, "text": "Multi-Head Attention", "orig": "Multi-Head Attention", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 88, "label": "text", "bbox": {"l": 150.552, "t": 441.45, "r": 197.149, "b": 445.643, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 81, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 150.552, "r_y0": 445.643, "r_x1": 197.149, "r_y1": 445.643, "r_x2": 197.149, "r_y2": 441.45, "r_x3": 150.552, "r_y3": 441.45, "coord_origin": "TOPLEFT"}, "text": "Add & Normalisation", "orig": "Add & Normalisation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 89, "label": "text", "bbox": {"l": 147.864, "t": 423.295, "r": 199.762, "b": 427.488, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 82, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 147.864, "r_y0": 427.488, "r_x1": 199.762, "r_y1": 427.488, "r_x2": 199.762, "r_y2": 423.295, "r_x3": 147.864, "r_y3": 423.295, "coord_origin": "TOPLEFT"}, "text": "Feed Forward Network", "orig": "Feed Forward Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 90, "label": "text", "bbox": {"l": 241.566, "t": 315.465, "r": 255.725, "b": 319.657, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 83, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 241.566, "r_y0": 319.657, "r_x1": 255.725, "r_y1": 319.657, "r_x2": 255.725, "r_y2": 315.465, "r_x3": 241.566, "r_y3": 315.465, "coord_origin": "TOPLEFT"}, "text": "Linear", "orig": "Linear", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 91, "label": "text", "bbox": {"l": 241.917, "t": 362.567, "r": 256.077, "b": 366.759, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 84, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 241.917, "r_y0": 366.759, "r_x1": 256.077, "r_y1": 366.759, "r_x2": 256.077, "r_y2": 362.567, "r_x3": 241.917, "r_y3": 362.567, "coord_origin": "TOPLEFT"}, "text": "Linear", "orig": "Linear", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 92, "label": "text", "bbox": {"l": 228.054, "t": 337.821, "r": 269.393, "b": 342.014, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 85, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 228.054, "r_y0": 342.014, "r_x1": 269.393, "r_y1": 342.014, "r_x2": 269.393, "r_y2": 337.821, "r_x3": 228.054, "r_y3": 337.821, "coord_origin": "TOPLEFT"}, "text": "Attention Network", "orig": "Attention Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 93, "label": "text", "bbox": {"l": 228.446, "t": 406.349, "r": 238.739, "b": 410.541, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 86, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 228.446, "r_y0": 410.541, "r_x1": 238.739, "r_y1": 410.541, "r_x2": 238.739, "r_y2": 406.349, "r_x3": 228.446, "r_y3": 406.349, "coord_origin": "TOPLEFT"}, "text": "MLP", "orig": "MLP", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 94, "label": "text", "bbox": {"l": 256.298, "t": 406.405, "r": 270.457, "b": 410.598, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 87, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 256.298, "r_y0": 410.598, "r_x1": 270.457, "r_y1": 410.598, "r_x2": 270.457, "r_y2": 406.405, "r_x3": 256.298, "r_y3": 406.405, "coord_origin": "TOPLEFT"}, "text": "Linear", "orig": "Linear", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 95, "label": "text", "bbox": {"l": 239.545, "t": 383.415, "r": 258.089, "b": 387.608, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 88, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 239.545, "r_y0": 387.608, "r_x1": 258.089, "r_y1": 387.608, "r_x2": 258.089, "r_y2": 383.415, "r_x3": 239.545, "r_y3": 383.415, "coord_origin": "TOPLEFT"}, "text": "Sigmoid", "orig": "Sigmoid", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 96, "label": "text", "bbox": {"l": 55.273, "t": 384.871, "r": 59.258, "b": 449.784, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 89, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 59.258, "r_y0": 449.783, "r_x1": 59.245, "r_y1": 384.871, "r_x2": 55.273, "r_y2": 384.872, "r_x3": 55.286, "r_y3": 449.784, "coord_origin": "TOPLEFT"}, "text": "Transformer Encoder Network", "orig": "Transformer Encoder Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 97, "label": "text", "bbox": {"l": 55.345, "t": 373.809, "r": 59.058, "b": 378.457, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 90, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 59.058, "r_y0": 378.454, "r_x1": 59.055, "r_y1": 373.809, "r_x2": 55.345, "r_y2": 373.812, "r_x3": 55.348, "r_y3": 378.457, "coord_origin": "TOPLEFT"}, "text": "x2", "orig": "x2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 98, "label": "text", "bbox": {"l": 85.295, "t": 485.687, "r": 122.166, "b": 490.108, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 91, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 85.296, "r_y0": 490.108, "r_x1": 122.166, "r_y1": 490.098, "r_x2": 122.165, "r_y2": 485.687, "r_x3": 85.295, "r_y3": 485.697, "coord_origin": "TOPLEFT"}, "text": "Encoded Output", "orig": "Encoded Output", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 99, "label": "text", "bbox": {"l": 229.665, "t": 281.281, "r": 265.321, "b": 285.074, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 92, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 229.666, "r_y0": 285.074, "r_x1": 265.321, "r_y1": 285.064, "r_x2": 265.32, "r_y2": 281.281, "r_x3": 229.665, "r_y3": 281.291, "coord_origin": "TOPLEFT"}, "text": "Encoded Output", "orig": "Encoded Output", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 100, "label": "text", "bbox": {"l": 157.172, "t": 501.45, "r": 190.419, "b": 505.871, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 93, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 157.174, "r_y0": 505.871, "r_x1": 190.419, "r_y1": 505.862, "r_x2": 190.417, "r_y2": 501.45, "r_x3": 157.172, "r_y3": 501.459, "coord_origin": "TOPLEFT"}, "text": "Predicted Tags", "orig": "Predicted Tags", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 101, "label": "text", "bbox": {"l": 227.815, "t": 439.211, "r": 269.396, "b": 443.634, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 94, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 227.816, "r_y0": 443.634, "r_x1": 269.396, "r_y1": 443.622, "r_x2": 269.395, "r_y2": 439.211, "r_x3": 227.815, "r_y3": 439.222, "coord_origin": "TOPLEFT"}, "text": "Bounding Boxes &", "orig": "Bounding Boxes &", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 102, "label": "text", "bbox": {"l": 233.701, "t": 445.212, "r": 263.513, "b": 449.632, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 95, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 233.703, "r_y0": 449.632, "r_x1": 263.513, "r_y1": 449.624, "r_x2": 263.511, "r_y2": 445.212, "r_x3": 233.701, "r_y3": 445.22, "coord_origin": "TOPLEFT"}, "text": "Classification", "orig": "Classification", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 103, "label": "text", "bbox": {"l": 184.747, "t": 294.534, "r": 210.91, "b": 298.506, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 96, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 184.747, "r_y0": 298.506, "r_x1": 210.91, "r_y1": 298.506, "r_x2": 210.91, "r_y2": 294.534, "r_x3": 184.747, "r_y3": 294.534, "coord_origin": "TOPLEFT"}, "text": "Transformer", "orig": "Transformer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 104, "label": "text", "bbox": {"l": 178.912, "t": 300.284, "r": 216.744, "b": 304.256, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 97, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 178.912, "r_y0": 304.256, "r_x1": 216.744, "r_y1": 304.256, "r_x2": 216.744, "r_y2": 300.284, "r_x3": 178.912, "r_y3": 300.284, "coord_origin": "TOPLEFT"}, "text": "Decoder Network", "orig": "Decoder Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 105, "label": "text", "bbox": {"l": 194.246, "t": 283.891, "r": 198.891, "b": 287.601, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 98, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 194.246, "r_y0": 287.601, "r_x1": 198.891, "r_y1": 287.601, "r_x2": 198.891, "r_y2": 283.891, "r_x3": 194.246, "r_y3": 283.891, "coord_origin": "TOPLEFT"}, "text": "x4", "orig": "x4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 106, "label": "text", "bbox": {"l": 221.456, "t": 273.134, "r": 276.471, "b": 277.548, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 99, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 221.456, "r_y0": 277.548, "r_x1": 276.471, "r_y1": 277.548, "r_x2": 276.471, "r_y2": 273.134, "r_x3": 221.456, "r_y3": 273.134, "coord_origin": "TOPLEFT"}, "text": "CELL BBOX DECODER", "orig": "CELL BBOX DECODER", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 107, "label": "text", "bbox": {"l": 151.652, "t": 324.644, "r": 195.97, "b": 328.837, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 100, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.652, "r_y0": 328.837, "r_x1": 195.97, "r_y1": 328.837, "r_x2": 195.97, "r_y2": 324.644, "r_x3": 151.652, "r_y3": 324.644, "coord_origin": "TOPLEFT"}, "text": "Masked Multi-Head", "orig": "Masked Multi-Head", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 108, "label": "text", "bbox": {"l": 163.433, "t": 330.644, "r": 184.19, "b": 334.837, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 101, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 163.433, "r_y0": 334.837, "r_x1": 184.19, "r_y1": 334.837, "r_x2": 184.19, "r_y2": 330.644, "r_x3": 163.433, "r_y3": 330.644, "coord_origin": "TOPLEFT"}, "text": "Attention", "orig": "Attention", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}]}, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null}, {"label": "caption", "id": 8, "page_no": 4, "cluster": {"id": 8, "label": "caption", "bbox": {"l": 50.112, "t": 527.783, "r": 286.366, "b": 680.185, "coord_origin": "TOPLEFT"}, "confidence": 0.8913407325744629, "cells": [{"index": 102, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 536.723, "r_x1": 85.878, "r_y1": 536.723, "r_x2": 85.878, "r_y2": 528.171, "r_x3": 50.112, "r_y3": 528.171, "coord_origin": "TOPLEFT"}, "text": "Figure 4:", "orig": "Figure 4:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 103, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 90.73, "r_y0": 536.723, "r_x1": 229.787, "r_y1": 536.723, "r_x2": 229.787, "r_y2": 528.171, "r_x3": 90.73, "r_y3": 528.171, "coord_origin": "TOPLEFT"}, "text": "Given an input image of a table, the", "orig": "Given an input image of a table, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 104, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 231.787, "r_y0": 536.739, "r_x1": 267.762, "r_y1": 536.739, "r_x2": 267.762, "r_y2": 527.783, "r_x3": 231.787, "r_y3": 527.783, "coord_origin": "TOPLEFT"}, "text": "Encoder", "orig": "Encoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 105, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 269.764, "r_y0": 536.723, "r_x1": 286.362, "r_y1": 536.723, "r_x2": 286.362, "r_y2": 528.171, "r_x3": 269.764, "r_y3": 528.171, "coord_origin": "TOPLEFT"}, "text": "pro-", "orig": "pro-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 106, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 548.678, "r_x1": 286.365, "r_y1": 548.678, "r_x2": 286.365, "r_y2": 540.126, "r_x3": 50.112, "r_y3": 540.126, "coord_origin": "TOPLEFT"}, "text": "duces fixed-length features that represent the input image.", "orig": "duces fixed-length features that represent the input image.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 107, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 560.634, "r_x1": 205.847, "r_y1": 560.634, "r_x2": 205.847, "r_y2": 552.082, "r_x3": 50.112, "r_y3": 552.082, "coord_origin": "TOPLEFT"}, "text": "The features are then passed to both the", "orig": "The features are then passed to both the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 108, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 208.018, "r_y0": 560.65, "r_x1": 286.364, "r_y1": 560.65, "r_x2": 286.364, "r_y2": 551.694, "r_x3": 208.018, "r_y3": 551.694, "coord_origin": "TOPLEFT"}, "text": "Structure Decoder", "orig": "Structure Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 109, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 572.5889999999999, "r_x1": 64.498, "r_y1": 572.5889999999999, "r_x2": 64.498, "r_y2": 564.037, "r_x3": 50.112, "r_y3": 564.037, "coord_origin": "TOPLEFT"}, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 110, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 68.165, "r_y0": 572.605, "r_x1": 151.313, "r_y1": 572.605, "r_x2": 151.313, "r_y2": 563.649, "r_x3": 68.165, "r_y3": 563.649, "coord_origin": "TOPLEFT"}, "text": "Cell BBox Decoder", "orig": "Cell BBox Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 111, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 151.313, "r_y0": 572.5889999999999, "r_x1": 153.804, "r_y1": 572.5889999999999, "r_x2": 153.804, "r_y2": 564.037, "r_x3": 151.313, "r_y3": 564.037, "coord_origin": "TOPLEFT"}, "text": ".", "orig": ".", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 112, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.419, "r_y0": 572.5889999999999, "r_x1": 241.933, "r_y1": 572.5889999999999, "r_x2": 241.933, "r_y2": 564.037, "r_x3": 160.419, "r_y3": 564.037, "coord_origin": "TOPLEFT"}, "text": "During training, the", "orig": "During training, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 113, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 245.595, "r_y0": 572.605, "r_x1": 286.362, "r_y1": 572.605, "r_x2": 286.362, "r_y2": 563.649, "r_x3": 245.595, "r_y3": 563.649, "coord_origin": "TOPLEFT"}, "text": "Structure", "orig": "Structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 114, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 584.56, "r_x1": 85.519, "r_y1": 584.56, "r_x2": 85.519, "r_y2": 575.604, "r_x3": 50.112, "r_y3": 575.604, "coord_origin": "TOPLEFT"}, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 115, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 88.623, "r_y0": 584.544, "r_x1": 286.361, "r_y1": 584.544, "r_x2": 286.361, "r_y2": 575.992, "r_x3": 88.623, "r_y3": 575.992, "coord_origin": "TOPLEFT"}, "text": "receives 'tokenized tags' of the HTML code that", "orig": "receives 'tokenized tags' of the HTML code that", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 116, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 596.499, "r_x1": 286.365, "r_y1": 596.499, "r_x2": 286.365, "r_y2": 587.947, "r_x3": 50.112, "r_y3": 587.947, "coord_origin": "TOPLEFT"}, "text": "represent the table structure. Afterwards, a transformer en-", "orig": "represent the table structure. Afterwards, a transformer en-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 117, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 608.454, "r_x1": 286.365, "r_y1": 608.454, "r_x2": 286.365, "r_y2": 599.902, "r_x3": 50.112, "r_y3": 599.902, "coord_origin": "TOPLEFT"}, "text": "coder and decoder architecture is employed to produce fea-", "orig": "coder and decoder architecture is employed to produce fea-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 118, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 620.409, "r_x1": 240.438, "r_y1": 620.409, "r_x2": 240.438, "r_y2": 611.857, "r_x3": 50.112, "r_y3": 611.857, "coord_origin": "TOPLEFT"}, "text": "tures that are received by a linear layer, and the", "orig": "tures that are received by a linear layer, and the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 119, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 243.198, "r_y0": 620.425, "r_x1": 286.366, "r_y1": 620.425, "r_x2": 286.366, "r_y2": 611.469, "r_x3": 243.198, "r_y3": 611.469, "coord_origin": "TOPLEFT"}, "text": "Cell BBox", "orig": "Cell BBox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 120, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 632.381, "r_x1": 87.013, "r_y1": 632.381, "r_x2": 87.013, "r_y2": 623.425, "r_x3": 50.112, "r_y3": 623.425, "coord_origin": "TOPLEFT"}, "text": "Decoder.", "orig": "Decoder.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 121, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 93.14, "r_y0": 632.381, "r_x1": 286.365, "r_y1": 632.381, "r_x2": 286.365, "r_y2": 623.425, "r_x3": 93.14, "r_y3": 623.425, "coord_origin": "TOPLEFT"}, "text": "The linear layer is applied to the features to", "orig": "The linear layer is applied to the features to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 122, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 644.336, "r_x1": 286.365, "r_y1": 644.336, "r_x2": 286.365, "r_y2": 635.38, "r_x3": 50.112, "r_y3": 635.38, "coord_origin": "TOPLEFT"}, "text": "predict the tags. Simultaneously, the Cell BBox Decoder", "orig": "predict the tags. Simultaneously, the Cell BBox Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 123, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 656.275, "r_x1": 220.582, "r_y1": 656.275, "r_x2": 220.582, "r_y2": 647.723, "r_x3": 50.112, "r_y3": 647.723, "coord_origin": "TOPLEFT"}, "text": "selects features referring to the data cells ('", "orig": "selects features referring to the data cells ('", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 124, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 220.578, "r_y0": 656.111, "r_x1": 228.327, "r_y1": 656.111, "r_x2": 228.327, "r_y2": 647.405, "r_x3": 220.578, "r_y3": 647.405, "coord_origin": "TOPLEFT"}, "text": "<", "orig": "<", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 125, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 228.327, "r_y0": 656.275, "r_x1": 236.078, "r_y1": 656.275, "r_x2": 236.078, "r_y2": 647.723, "r_x3": 228.327, "r_y3": 647.723, "coord_origin": "TOPLEFT"}, "text": "td", "orig": "td", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 126, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 236.078, "r_y0": 656.111, "r_x1": 243.827, "r_y1": 656.111, "r_x2": 243.827, "r_y2": 647.405, "r_x3": 236.078, "r_y3": 647.405, "coord_origin": "TOPLEFT"}, "text": ">", "orig": ">", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 127, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 243.826, "r_y0": 656.275, "r_x1": 255.293, "r_y1": 656.275, "r_x2": 255.293, "r_y2": 647.723, "r_x3": 243.826, "r_y3": 647.723, "coord_origin": "TOPLEFT"}, "text": "', '", "orig": "', '", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 128, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 255.291, "r_y0": 656.111, "r_x1": 263.04, "r_y1": 656.111, "r_x2": 263.04, "r_y2": 647.405, "r_x3": 255.291, "r_y3": 647.405, "coord_origin": "TOPLEFT"}, "text": "<", "orig": "<", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 129, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 263.04, "r_y0": 656.275, "r_x1": 286.362, "r_y1": 656.275, "r_x2": 286.362, "r_y2": 647.723, "r_x3": 263.04, "r_y3": 647.723, "coord_origin": "TOPLEFT"}, "text": "') and", "orig": "') and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 130, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 668.23, "r_x1": 286.365, "r_y1": 668.23, "r_x2": 286.365, "r_y2": 659.678, "r_x3": 50.112, "r_y3": 659.678, "coord_origin": "TOPLEFT"}, "text": "passes them through an attention network, an MLP, and a", "orig": "passes them through an attention network, an MLP, and a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 131, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 680.185, "r_x1": 218.47, "r_y1": 680.185, "r_x2": 218.47, "r_y2": 671.633, "r_x3": 50.112, "r_y3": 671.633, "coord_origin": "TOPLEFT"}, "text": "linear layer to predict the bounding boxes.", "orig": "linear layer to predict the bounding boxes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Figure 4: Given an input image of a table, the Encoder produces fixed-length features that represent the input image. The features are then passed to both the Structure Decoder and Cell BBox Decoder . During training, the Structure Decoder receives 'tokenized tags' of the HTML code that represent the table structure. Afterwards, a transformer encoder and decoder architecture is employed to produce features that are received by a linear layer, and the Cell BBox Decoder. The linear layer is applied to the features to predict the tags. Simultaneously, the Cell BBox Decoder selects features referring to the data cells (' < td > ', ' < ') and passes them through an attention network, an MLP, and a linear layer to predict the bounding boxes."}, {"label": "text", "id": 4, "page_no": 4, "cluster": {"id": 4, "label": "text", "bbox": {"l": 308.862, "t": 249.803, "r": 545.115, "b": 294.221, "coord_origin": "TOPLEFT"}, "confidence": 0.9831458330154419, "cells": [{"index": 132, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 258.355, "r_x1": 545.115, "r_y1": 258.355, "r_x2": 545.115, "r_y2": 249.803, "r_x3": 308.862, "r_y3": 249.803, "coord_origin": "TOPLEFT"}, "text": "forming classification, and adding an adaptive pooling layer", "orig": "forming classification, and adding an adaptive pooling layer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 133, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 270.31100000000004, "r_x1": 366.466, "r_y1": 270.31100000000004, "r_x2": 366.466, "r_y2": 261.759, "r_x3": 308.862, "r_y3": 261.759, "coord_origin": "TOPLEFT"}, "text": "of size 28*28.", "orig": "of size 28*28.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 134, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 371.706, "r_y0": 270.31100000000004, "r_x1": 545.115, "r_y1": 270.31100000000004, "r_x2": 545.115, "r_y2": 261.759, "r_x3": 371.706, "r_y3": 261.759, "coord_origin": "TOPLEFT"}, "text": "ResNet by default downsamples the image", "orig": "ResNet by default downsamples the image", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 135, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 282.266, "r_x1": 545.115, "r_y1": 282.266, "r_x2": 545.115, "r_y2": 273.71400000000006, "r_x3": 308.862, "r_y3": 273.71400000000006, "coord_origin": "TOPLEFT"}, "text": "resolution by 32 and then the encoded image is provided to", "orig": "resolution by 32 and then the encoded image is provided to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 136, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 294.221, "r_x1": 341.24, "r_y1": 294.221, "r_x2": 341.24, "r_y2": 285.669, "r_x3": 308.862, "r_y3": 285.669, "coord_origin": "TOPLEFT"}, "text": "both the", "orig": "both the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 137, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 343.731, "r_y0": 294.078, "r_x1": 417.235, "r_y1": 294.078, "r_x2": 417.235, "r_y2": 285.49, "r_x3": 343.731, "r_y3": 285.49, "coord_origin": "TOPLEFT"}, "text": "Structure Decoder", "orig": "Structure Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 138, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 417.234, "r_y0": 294.221, "r_x1": 436.601, "r_y1": 294.221, "r_x2": 436.601, "r_y2": 285.669, "r_x3": 417.234, "r_y3": 285.669, "coord_origin": "TOPLEFT"}, "text": ", and", "orig": ", and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 139, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 439.092, "r_y0": 294.078, "r_x1": 516.561, "r_y1": 294.078, "r_x2": 516.561, "r_y2": 285.49, "r_x3": 439.092, "r_y3": 285.49, "coord_origin": "TOPLEFT"}, "text": "Cell BBox Decoder", "orig": "Cell BBox Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 140, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 516.561, "r_y0": 294.221, "r_x1": 519.052, "r_y1": 294.221, "r_x2": 519.052, "r_y2": 285.669, "r_x3": 516.561, "r_y3": 285.669, "coord_origin": "TOPLEFT"}, "text": ".", "orig": ".", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "forming classification, and adding an adaptive pooling layer of size 28*28. ResNet by default downsamples the image resolution by 32 and then the encoded image is provided to both the Structure Decoder , and Cell BBox Decoder ."}, {"label": "text", "id": 1, "page_no": 4, "cluster": {"id": 1, "label": "text", "bbox": {"l": 308.862, "t": 297.34, "r": 545.115, "b": 413.876, "coord_origin": "TOPLEFT"}, "confidence": 0.9862009882926941, "cells": [{"index": 141, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 306.296, "r_x1": 400.866, "r_y1": 306.296, "r_x2": 400.866, "r_y2": 297.34, "r_x3": 320.817, "r_y3": 297.34, "coord_origin": "TOPLEFT"}, "text": "Structure Decoder.", "orig": "Structure Decoder.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 142, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 403.914, "r_y0": 306.28, "r_x1": 545.114, "r_y1": 306.28, "r_x2": 545.114, "r_y2": 297.728, "r_x3": 403.914, "r_y3": 297.728, "coord_origin": "TOPLEFT"}, "text": "The transformer architecture of this", "orig": "The transformer architecture of this", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 143, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 318.235, "r_x1": 517.529, "r_y1": 318.235, "r_x2": 517.529, "r_y2": 309.683, "r_x3": 308.862, "r_y3": 309.683, "coord_origin": "TOPLEFT"}, "text": "component is based on the work proposed in [31].", "orig": "component is based on the work proposed in [31].", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 144, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 524.094, "r_y0": 318.235, "r_x1": 545.115, "r_y1": 318.235, "r_x2": 545.115, "r_y2": 309.683, "r_x3": 524.094, "r_y3": 309.683, "coord_origin": "TOPLEFT"}, "text": "After", "orig": "After", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 145, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 330.19, "r_x1": 432.358, "r_y1": 330.19, "r_x2": 432.358, "r_y2": 321.638, "r_x3": 308.862, "r_y3": 321.638, "coord_origin": "TOPLEFT"}, "text": "extensive experimentation, the", "orig": "extensive experimentation, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 146, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 435.82, "r_y0": 330.047, "r_x1": 510.29, "r_y1": 330.047, "r_x2": 510.29, "r_y2": 321.459, "r_x3": 435.82, "r_y3": 321.459, "coord_origin": "TOPLEFT"}, "text": "Structure Decoder", "orig": "Structure Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 147, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 513.978, "r_y0": 330.19, "r_x1": 520.623, "r_y1": 330.19, "r_x2": 520.623, "r_y2": 321.638, "r_x3": 513.978, "r_y3": 321.638, "coord_origin": "TOPLEFT"}, "text": "is", "orig": "is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 148, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 524.08, "r_y0": 330.19, "r_x1": 545.111, "r_y1": 330.19, "r_x2": 545.111, "r_y2": 321.638, "r_x3": 524.08, "r_y3": 321.638, "coord_origin": "TOPLEFT"}, "text": "mod-", "orig": "mod-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 149, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 342.145, "r_x1": 545.115, "r_y1": 342.145, "r_x2": 545.115, "r_y2": 333.593, "r_x3": 308.862, "r_y3": 333.593, "coord_origin": "TOPLEFT"}, "text": "eled as a transformer encoder with two encoder layers and", "orig": "eled as a transformer encoder with two encoder layers and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 150, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 354.1, "r_x1": 545.115, "r_y1": 354.1, "r_x2": 545.115, "r_y2": 345.548, "r_x3": 308.862, "r_y3": 345.548, "coord_origin": "TOPLEFT"}, "text": "a transformer decoder made from a stack of 4 decoder lay-", "orig": "a transformer decoder made from a stack of 4 decoder lay-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 151, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 366.056, "r_x1": 545.115, "r_y1": 366.056, "r_x2": 545.115, "r_y2": 357.504, "r_x3": 308.862, "r_y3": 357.504, "coord_origin": "TOPLEFT"}, "text": "ers that comprise mainly of multi-head attention and feed", "orig": "ers that comprise mainly of multi-head attention and feed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 152, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 378.011, "r_x1": 370.391, "r_y1": 378.011, "r_x2": 370.391, "r_y2": 369.459, "r_x3": 308.862, "r_y3": 369.459, "coord_origin": "TOPLEFT"}, "text": "forward layers.", "orig": "forward layers.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 153, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 377.445, "r_y0": 378.011, "r_x1": 545.115, "r_y1": 378.011, "r_x2": 545.115, "r_y2": 369.459, "r_x3": 377.445, "r_y3": 369.459, "coord_origin": "TOPLEFT"}, "text": "This configuration uses fewer layers and", "orig": "This configuration uses fewer layers and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 154, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 389.966, "r_x1": 545.115, "r_y1": 389.966, "r_x2": 545.115, "r_y2": 381.414, "r_x3": 308.862, "r_y3": 381.414, "coord_origin": "TOPLEFT"}, "text": "heads in comparison to networks applied to other problems", "orig": "heads in comparison to networks applied to other problems", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 155, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 401.921, "r_x1": 326.566, "r_y1": 401.921, "r_x2": 326.566, "r_y2": 393.369, "r_x3": 308.862, "r_y3": 393.369, "coord_origin": "TOPLEFT"}, "text": "(e.g.", "orig": "(e.g.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 156, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 331.069, "r_y0": 401.921, "r_x1": 545.115, "r_y1": 401.921, "r_x2": 545.115, "r_y2": 393.369, "r_x3": 331.069, "r_y3": 393.369, "coord_origin": "TOPLEFT"}, "text": "'Scene Understanding', 'Image Captioning'), some-", "orig": "'Scene Understanding', 'Image Captioning'), some-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 157, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 413.876, "r_x1": 528.019, "r_y1": 413.876, "r_x2": 528.019, "r_y2": 405.324, "r_x3": 308.862, "r_y3": 405.324, "coord_origin": "TOPLEFT"}, "text": "thing which we relate to the simplicity of table images.", "orig": "thing which we relate to the simplicity of table images.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Structure Decoder. The transformer architecture of this component is based on the work proposed in [31]. After extensive experimentation, the Structure Decoder is modeled as a transformer encoder with two encoder layers and a transformer decoder made from a stack of 4 decoder layers that comprise mainly of multi-head attention and feed forward layers. This configuration uses fewer layers and heads in comparison to networks applied to other problems (e.g. 'Scene Understanding', 'Image Captioning'), something which we relate to the simplicity of table images."}, {"label": "text", "id": 3, "page_no": 4, "cluster": {"id": 3, "label": "text", "bbox": {"l": 308.862, "t": 417.383, "r": 545.115, "b": 545.487, "coord_origin": "TOPLEFT"}, "confidence": 0.9851906895637512, "cells": [{"index": 158, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 425.935, "r_x1": 336.309, "r_y1": 425.935, "r_x2": 336.309, "r_y2": 417.383, "r_x3": 320.817, "r_y3": 417.383, "coord_origin": "TOPLEFT"}, "text": "The", "orig": "The", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 159, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 341.579, "r_y0": 425.935, "r_x1": 388.055, "r_y1": 425.935, "r_x2": 388.055, "r_y2": 417.383, "r_x3": 341.579, "r_y3": 417.383, "coord_origin": "TOPLEFT"}, "text": "transformer", "orig": "transformer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 160, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 393.325, "r_y0": 425.935, "r_x1": 424.856, "r_y1": 425.935, "r_x2": 424.856, "r_y2": 417.383, "r_x3": 393.325, "r_y3": 417.383, "coord_origin": "TOPLEFT"}, "text": "encoder", "orig": "encoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 161, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 430.117, "r_y0": 425.935, "r_x1": 462.356, "r_y1": 425.935, "r_x2": 462.356, "r_y2": 417.383, "r_x3": 430.117, "r_y3": 417.383, "coord_origin": "TOPLEFT"}, "text": "receives", "orig": "receives", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 162, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 467.626, "r_y0": 425.935, "r_x1": 477.031, "r_y1": 425.935, "r_x2": 477.031, "r_y2": 417.383, "r_x3": 467.626, "r_y3": 417.383, "coord_origin": "TOPLEFT"}, "text": "an", "orig": "an", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 163, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 482.301, "r_y0": 425.935, "r_x1": 515.496, "r_y1": 425.935, "r_x2": 515.496, "r_y2": 417.383, "r_x3": 482.301, "r_y3": 417.383, "coord_origin": "TOPLEFT"}, "text": "encoded", "orig": "encoded", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 164, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 520.766, "r_y0": 425.935, "r_x1": 545.115, "r_y1": 425.935, "r_x2": 545.115, "r_y2": 417.383, "r_x3": 520.766, "r_y3": 417.383, "coord_origin": "TOPLEFT"}, "text": "image", "orig": "image", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 165, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 437.89, "r_x1": 343.721, "r_y1": 437.89, "r_x2": 343.721, "r_y2": 429.338, "r_x3": 308.862, "r_y3": 429.338, "coord_origin": "TOPLEFT"}, "text": "from the", "orig": "from the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 166, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 347.038, "r_y0": 437.747, "r_x1": 446.455, "r_y1": 437.747, "r_x2": 446.455, "r_y2": 429.159, "r_x3": 347.038, "r_y3": 429.159, "coord_origin": "TOPLEFT"}, "text": "CNN Backbone Network", "orig": "CNN Backbone Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 167, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 449.94, "r_y0": 437.89, "r_x1": 545.113, "r_y1": 437.89, "r_x2": 545.113, "r_y2": 429.338, "r_x3": 449.94, "r_y3": 429.338, "coord_origin": "TOPLEFT"}, "text": "and refines it through a", "orig": "and refines it through a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 168, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 449.845, "r_x1": 545.115, "r_y1": 449.845, "r_x2": 545.115, "r_y2": 441.293, "r_x3": 308.862, "r_y3": 441.293, "coord_origin": "TOPLEFT"}, "text": "multi-head dot-product attention layer, followed by a Feed", "orig": "multi-head dot-product attention layer, followed by a Feed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 169, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 461.8, "r_x1": 384.149, "r_y1": 461.8, "r_x2": 384.149, "r_y2": 453.248, "r_x3": 308.862, "r_y3": 453.248, "coord_origin": "TOPLEFT"}, "text": "Forward Network.", "orig": "Forward Network.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 170, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 393.375, "r_y0": 461.8, "r_x1": 459.616, "r_y1": 461.8, "r_x2": 459.616, "r_y2": 453.248, "r_x3": 393.375, "r_y3": 453.248, "coord_origin": "TOPLEFT"}, "text": "During training,", "orig": "During training,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 171, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 464.667, "r_y0": 461.8, "r_x1": 476.841, "r_y1": 461.8, "r_x2": 476.841, "r_y2": 453.248, "r_x3": 464.667, "r_y3": 453.248, "coord_origin": "TOPLEFT"}, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 172, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 481.374, "r_y0": 461.8, "r_x1": 527.85, "r_y1": 461.8, "r_x2": 527.85, "r_y2": 453.248, "r_x3": 481.374, "r_y3": 453.248, "coord_origin": "TOPLEFT"}, "text": "transformer", "orig": "transformer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 173, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 532.393, "r_y0": 461.8, "r_x1": 545.115, "r_y1": 461.8, "r_x2": 545.115, "r_y2": 453.248, "r_x3": 532.393, "r_y3": 453.248, "coord_origin": "TOPLEFT"}, "text": "de-", "orig": "de-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 174, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 473.756, "r_x1": 545.115, "r_y1": 473.756, "r_x2": 545.115, "r_y2": 465.204, "r_x3": 308.862, "r_y3": 465.204, "coord_origin": "TOPLEFT"}, "text": "coder receives as input the output feature produced by the", "orig": "coder receives as input the output feature produced by the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 175, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 485.711, "r_x1": 545.115, "r_y1": 485.711, "r_x2": 545.115, "r_y2": 477.159, "r_x3": 308.862, "r_y3": 477.159, "coord_origin": "TOPLEFT"}, "text": "transformer encoder, and the tokenized input of the HTML", "orig": "transformer encoder, and the tokenized input of the HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 176, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 497.666, "r_x1": 545.115, "r_y1": 497.666, "r_x2": 545.115, "r_y2": 489.114, "r_x3": 308.862, "r_y3": 489.114, "coord_origin": "TOPLEFT"}, "text": "ground-truth tags. Using a stack of multi-head attention lay-", "orig": "ground-truth tags. Using a stack of multi-head attention lay-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 177, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 509.621, "r_x1": 545.115, "r_y1": 509.621, "r_x2": 545.115, "r_y2": 501.069, "r_x3": 308.862, "r_y3": 501.069, "coord_origin": "TOPLEFT"}, "text": "ers, different aspects of the tag sequence could be inferred.", "orig": "ers, different aspects of the tag sequence could be inferred.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 178, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 521.576, "r_x1": 545.115, "r_y1": 521.576, "r_x2": 545.115, "r_y2": 513.024, "r_x3": 308.862, "r_y3": 513.024, "coord_origin": "TOPLEFT"}, "text": "This is achieved by each attention head on a layer operating", "orig": "This is achieved by each attention head on a layer operating", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 179, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 533.5319999999999, "r_x1": 545.115, "r_y1": 533.5319999999999, "r_x2": 545.115, "r_y2": 524.98, "r_x3": 308.862, "r_y3": 524.98, "coord_origin": "TOPLEFT"}, "text": "in a different subspace, and then combining altogether their", "orig": "in a different subspace, and then combining altogether their", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 180, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 545.487, "r_x1": 369.733, "r_y1": 545.487, "r_x2": 369.733, "r_y2": 536.935, "r_x3": 308.862, "r_y3": 536.935, "coord_origin": "TOPLEFT"}, "text": "attention score.", "orig": "attention score.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "The transformer encoder receives an encoded image from the CNN Backbone Network and refines it through a multi-head dot-product attention layer, followed by a Feed Forward Network. During training, the transformer decoder receives as input the output feature produced by the transformer encoder, and the tokenized input of the HTML ground-truth tags. Using a stack of multi-head attention layers, different aspects of the tag sequence could be inferred. This is achieved by each attention head on a layer operating in a different subspace, and then combining altogether their attention score."}, {"label": "text", "id": 0, "page_no": 4, "cluster": {"id": 0, "label": "text", "bbox": {"l": 308.862, "t": 548.605, "r": 545.115, "b": 653.187, "coord_origin": "TOPLEFT"}, "confidence": 0.9869195818901062, "cells": [{"index": 181, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 557.561, "r_x1": 404.762, "r_y1": 557.561, "r_x2": 404.762, "r_y2": 548.605, "r_x3": 320.817, "r_y3": 548.605, "coord_origin": "TOPLEFT"}, "text": "Cell BBox Decoder.", "orig": "Cell BBox Decoder.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 182, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 410.341, "r_y0": 557.545, "r_x1": 545.115, "r_y1": 557.545, "r_x2": 545.115, "r_y2": 548.9929999999999, "r_x3": 410.341, "r_y3": 548.9929999999999, "coord_origin": "TOPLEFT"}, "text": "Our architecture allows to simul-", "orig": "Our architecture allows to simul-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 183, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 569.501, "r_x1": 545.115, "r_y1": 569.501, "r_x2": 545.115, "r_y2": 560.9490000000001, "r_x3": 308.862, "r_y3": 560.9490000000001, "coord_origin": "TOPLEFT"}, "text": "taneously predict HTML tags and bounding boxes for each", "orig": "taneously predict HTML tags and bounding boxes for each", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 184, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 581.456, "r_x1": 545.115, "r_y1": 581.456, "r_x2": 545.115, "r_y2": 572.904, "r_x3": 308.862, "r_y3": 572.904, "coord_origin": "TOPLEFT"}, "text": "table cell without the need of a separate object detector end", "orig": "table cell without the need of a separate object detector end", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 185, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 593.4110000000001, "r_x1": 336.458, "r_y1": 593.4110000000001, "r_x2": 336.458, "r_y2": 584.859, "r_x3": 308.862, "r_y3": 584.859, "coord_origin": "TOPLEFT"}, "text": "to end.", "orig": "to end.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 186, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 340.971, "r_y0": 593.4110000000001, "r_x1": 545.115, "r_y1": 593.4110000000001, "r_x2": 545.115, "r_y2": 584.859, "r_x3": 340.971, "r_y3": 584.859, "coord_origin": "TOPLEFT"}, "text": "This approach is inspired by DETR [1] which em-", "orig": "This approach is inspired by DETR [1] which em-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 187, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 605.366, "r_x1": 545.115, "r_y1": 605.366, "r_x2": 545.115, "r_y2": 596.814, "r_x3": 308.862, "r_y3": 596.814, "coord_origin": "TOPLEFT"}, "text": "ploys a Transformer Encoder, and Decoder that looks for", "orig": "ploys a Transformer Encoder, and Decoder that looks for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 188, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 617.321, "r_x1": 545.115, "r_y1": 617.321, "r_x2": 545.115, "r_y2": 608.769, "r_x3": 308.862, "r_y3": 608.769, "coord_origin": "TOPLEFT"}, "text": "a specific number of object queries (potential object detec-", "orig": "a specific number of object queries (potential object detec-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 189, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 629.2760000000001, "r_x1": 545.115, "r_y1": 629.2760000000001, "r_x2": 545.115, "r_y2": 620.7239999999999, "r_x3": 308.862, "r_y3": 620.7239999999999, "coord_origin": "TOPLEFT"}, "text": "tions). As our model utilizes a transformer architecture, the", "orig": "tions). As our model utilizes a transformer architecture, the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 190, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 641.232, "r_x1": 381.679, "r_y1": 641.232, "r_x2": 381.679, "r_y2": 632.6800000000001, "r_x3": 308.862, "r_y3": 632.6800000000001, "coord_origin": "TOPLEFT"}, "text": "hidden state of the", "orig": "hidden state of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 191, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 383.997, "r_y0": 641.068, "r_x1": 391.746, "r_y1": 641.068, "r_x2": 391.746, "r_y2": 632.362, "r_x3": 383.997, "r_y3": 632.362, "coord_origin": "TOPLEFT"}, "text": "<", "orig": "<", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 192, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 391.746, "r_y0": 641.232, "r_x1": 399.497, "r_y1": 641.232, "r_x2": 399.497, "r_y2": 632.6800000000001, "r_x3": 391.746, "r_y3": 632.6800000000001, "coord_origin": "TOPLEFT"}, "text": "td", "orig": "td", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 193, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 399.497, "r_y0": 641.068, "r_x1": 407.246, "r_y1": 641.068, "r_x2": 407.246, "r_y2": 632.362, "r_x3": 399.497, "r_y3": 632.362, "coord_origin": "TOPLEFT"}, "text": ">", "orig": ">", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 194, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 407.246, "r_y0": 641.232, "r_x1": 432.91, "r_y1": 641.232, "r_x2": 432.91, "r_y2": 632.6800000000001, "r_x3": 407.246, "r_y3": 632.6800000000001, "coord_origin": "TOPLEFT"}, "text": "' and '", "orig": "' and '", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 195, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 432.908, "r_y0": 641.068, "r_x1": 440.657, "r_y1": 641.068, "r_x2": 440.657, "r_y2": 632.362, "r_x3": 432.908, "r_y3": 632.362, "coord_origin": "TOPLEFT"}, "text": "<", "orig": "<", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 196, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 440.657, "r_y0": 641.232, "r_x1": 545.115, "r_y1": 641.232, "r_x2": 545.115, "r_y2": 632.6800000000001, "r_x3": 440.657, "r_y3": 632.6800000000001, "coord_origin": "TOPLEFT"}, "text": "' HTMLstructure tags be-", "orig": "' HTMLstructure tags be-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 197, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 653.187, "r_x1": 398.964, "r_y1": 653.187, "r_x2": 398.964, "r_y2": 644.635, "r_x3": 308.862, "r_y3": 644.635, "coord_origin": "TOPLEFT"}, "text": "come the object query.", "orig": "come the object query.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Cell BBox Decoder. Our architecture allows to simultaneously predict HTML tags and bounding boxes for each table cell without the need of a separate object detector end to end. This approach is inspired by DETR [1] which employs a Transformer Encoder, and Decoder that looks for a specific number of object queries (potential object detections). As our model utilizes a transformer architecture, the hidden state of the < td > ' and ' < ' HTMLstructure tags become the object query."}, {"label": "text", "id": 2, "page_no": 4, "cluster": {"id": 2, "label": "text", "bbox": {"l": 308.862, "t": 656.515, "r": 545.115, "b": 713.066, "coord_origin": "TOPLEFT"}, "confidence": 0.9852352142333984, "cells": [{"index": 198, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 665.246, "r_x1": 444.343, "r_y1": 665.246, "r_x2": 444.343, "r_y2": 656.694, "r_x3": 320.817, "r_y3": 656.694, "coord_origin": "TOPLEFT"}, "text": "The encoding generated by the", "orig": "The encoding generated by the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 199, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 447.006, "r_y0": 665.103, "r_x1": 545.108, "r_y1": 665.103, "r_x2": 545.108, "r_y2": 656.515, "r_x3": 447.006, "r_y3": 656.515, "coord_origin": "TOPLEFT"}, "text": "CNN Backbone Network", "orig": "CNN Backbone Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 200, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 677.201, "r_x1": 545.115, "r_y1": 677.201, "r_x2": 545.115, "r_y2": 668.649, "r_x3": 308.862, "r_y3": 668.649, "coord_origin": "TOPLEFT"}, "text": "along with the features acquired for every data cell from the", "orig": "along with the features acquired for every data cell from the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 201, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 689.156, "r_x1": 545.115, "r_y1": 689.156, "r_x2": 545.115, "r_y2": 680.604, "r_x3": 308.862, "r_y3": 680.604, "coord_origin": "TOPLEFT"}, "text": "Transformer Decoder are then passed to the attention net-", "orig": "Transformer Decoder are then passed to the attention net-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 202, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 701.111, "r_x1": 545.115, "r_y1": 701.111, "r_x2": 545.115, "r_y2": 692.559, "r_x3": 308.862, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "work. The attention network takes both inputs and learns to", "orig": "work. The attention network takes both inputs and learns to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 203, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 713.066, "r_x1": 470.425, "r_y1": 713.066, "r_x2": 470.425, "r_y2": 704.514, "r_x3": 308.862, "r_y3": 704.514, "coord_origin": "TOPLEFT"}, "text": "provide an attention weighted encoding.", "orig": "provide an attention weighted encoding.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 204, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 474.63, "r_y0": 713.066, "r_x1": 545.115, "r_y1": 713.066, "r_x2": 545.115, "r_y2": 704.514, "r_x3": 474.63, "r_y3": 704.514, "coord_origin": "TOPLEFT"}, "text": "This weighted at-", "orig": "This weighted at-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "The encoding generated by the CNN Backbone Network along with the features acquired for every data cell from the Transformer Decoder are then passed to the attention network. The attention network takes both inputs and learns to provide an attention weighted encoding. This weighted at-"}], "headers": [{"label": "page_footer", "id": 9, "page_no": 4, "cluster": {"id": 9, "label": "page_footer", "bbox": {"l": 295.121, "t": 734.402, "r": 300.102, "b": 742.954, "coord_origin": "TOPLEFT"}, "confidence": 0.8719564080238342, "cells": [{"index": 205, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 295.121, "r_y0": 742.954, "r_x1": 300.102, "r_y1": 742.954, "r_x2": 300.102, "r_y2": 734.402, "r_x3": 295.121, "r_y3": 734.402, "coord_origin": "TOPLEFT"}, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "5"}]}}, {"page_no": 5, "size": {"width": 612.0, "height": 792.0}, "cells": [{"index": 0, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 84.029, "r_x1": 286.365, "r_y1": 84.029, "r_x2": 286.365, "r_y2": 75.47699999999998, "r_x3": 50.112, "r_y3": 75.47699999999998, "coord_origin": "TOPLEFT"}, "text": "tention encoding is then multiplied to the encoded image to", "orig": "tention encoding is then multiplied to the encoded image to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 95.98400000000004, "r_x1": 286.365, "r_y1": 95.98400000000004, "r_x2": 286.365, "r_y2": 87.43200000000002, "r_x3": 50.112, "r_y3": 87.43200000000002, "coord_origin": "TOPLEFT"}, "text": "produce a feature for each table cell. Notice that this is dif-", "orig": "produce a feature for each table cell. Notice that this is dif-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 107.93899999999996, "r_x1": 286.365, "r_y1": 107.93899999999996, "r_x2": 286.365, "r_y2": 99.38699999999994, "r_x3": 50.112, "r_y3": 99.38699999999994, "coord_origin": "TOPLEFT"}, "text": "ferent than the typical object detection problem where im-", "orig": "ferent than the typical object detection problem where im-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 119.894, "r_x1": 286.365, "r_y1": 119.894, "r_x2": 286.365, "r_y2": 111.34199999999998, "r_x3": 50.112, "r_y3": 111.34199999999998, "coord_origin": "TOPLEFT"}, "text": "balances between the number of detections and the amount", "orig": "balances between the number of detections and the amount", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 131.84900000000005, "r_x1": 135.691, "r_y1": 131.84900000000005, "r_x2": 135.691, "r_y2": 123.29700000000003, "r_x3": 50.112, "r_y3": 123.29700000000003, "coord_origin": "TOPLEFT"}, "text": "of objects may exist.", "orig": "of objects may exist.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 142.047, "r_y0": 131.84900000000005, "r_x1": 286.365, "r_y1": 131.84900000000005, "r_x2": 286.365, "r_y2": 123.29700000000003, "r_x3": 142.047, "r_y3": 123.29700000000003, "coord_origin": "TOPLEFT"}, "text": "In our case, we know up front that", "orig": "In our case, we know up front that", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 143.80499999999995, "r_x1": 286.365, "r_y1": 143.80499999999995, "r_x2": 286.365, "r_y2": 135.25300000000004, "r_x3": 50.112, "r_y3": 135.25300000000004, "coord_origin": "TOPLEFT"}, "text": "the produced detections always match with the table cells", "orig": "the produced detections always match with the table cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 155.76, "r_x1": 175.163, "r_y1": 155.76, "r_x2": 175.163, "r_y2": 147.20799999999997, "r_x3": 50.112, "r_y3": 147.20799999999997, "coord_origin": "TOPLEFT"}, "text": "in number and correspondence.", "orig": "in number and correspondence.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 168.44500000000005, "r_x1": 108.154, "r_y1": 168.44500000000005, "r_x2": 108.154, "r_y2": 159.89300000000003, "r_x3": 62.067, "r_y3": 159.89300000000003, "coord_origin": "TOPLEFT"}, "text": "The output", "orig": "The output", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 113.275, "r_y0": 168.44500000000005, "r_x1": 144.806, "r_y1": 168.44500000000005, "r_x2": 144.806, "r_y2": 159.89300000000003, "r_x3": 113.275, "r_y3": 159.89300000000003, "coord_origin": "TOPLEFT"}, "text": "features", "orig": "features", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 149.937, "r_y0": 168.44500000000005, "r_x1": 161.554, "r_y1": 168.44500000000005, "r_x2": 161.554, "r_y2": 159.89300000000003, "r_x3": 149.937, "r_y3": 159.89300000000003, "coord_origin": "TOPLEFT"}, "text": "for", "orig": "for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 166.684, "r_y0": 168.44500000000005, "r_x1": 184.936, "r_y1": 168.44500000000005, "r_x2": 184.936, "r_y2": 159.89300000000003, "r_x3": 166.684, "r_y3": 159.89300000000003, "coord_origin": "TOPLEFT"}, "text": "each", "orig": "each", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 190.057, "r_y0": 168.44500000000005, "r_x1": 209.424, "r_y1": 168.44500000000005, "r_x2": 209.424, "r_y2": 159.89300000000003, "r_x3": 190.057, "r_y3": 159.89300000000003, "coord_origin": "TOPLEFT"}, "text": "table", "orig": "table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 214.555, "r_y0": 168.44500000000005, "r_x1": 228.941, "r_y1": 168.44500000000005, "r_x2": 228.941, "r_y2": 159.89300000000003, "r_x3": 214.555, "r_y3": 159.89300000000003, "coord_origin": "TOPLEFT"}, "text": "cell", "orig": "cell", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 234.061, "r_y0": 168.44500000000005, "r_x1": 246.226, "r_y1": 168.44500000000005, "r_x2": 246.226, "r_y2": 159.89300000000003, "r_x3": 234.061, "r_y3": 159.89300000000003, "coord_origin": "TOPLEFT"}, "text": "are", "orig": "are", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 251.356, "r_y0": 168.44500000000005, "r_x1": 268.512, "r_y1": 168.44500000000005, "r_x2": 268.512, "r_y2": 159.89300000000003, "r_x3": 251.356, "r_y3": 159.89300000000003, "coord_origin": "TOPLEFT"}, "text": "then", "orig": "then", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 273.643, "r_y0": 168.44500000000005, "r_x1": 286.365, "r_y1": 168.44500000000005, "r_x2": 286.365, "r_y2": 159.89300000000003, "r_x3": 273.643, "r_y3": 159.89300000000003, "coord_origin": "TOPLEFT"}, "text": "fed", "orig": "fed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 180.40099999999995, "r_x1": 65.614, "r_y1": 180.40099999999995, "r_x2": 65.614, "r_y2": 171.84900000000005, "r_x3": 50.112, "r_y3": 171.84900000000005, "coord_origin": "TOPLEFT"}, "text": "into", "orig": "into", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.107, "r_y0": 180.40099999999995, "r_x1": 82.281, "r_y1": 180.40099999999995, "r_x2": 82.281, "r_y2": 171.84900000000005, "r_x3": 70.107, "r_y3": 171.84900000000005, "coord_origin": "TOPLEFT"}, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 19, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 86.764, "r_y0": 180.40099999999995, "r_x1": 138.66, "r_y1": 180.40099999999995, "r_x2": 138.66, "r_y2": 171.84900000000005, "r_x3": 86.764, "r_y3": 171.84900000000005, "coord_origin": "TOPLEFT"}, "text": "feed-forward", "orig": "feed-forward", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 20, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 143.153, "r_y0": 180.40099999999995, "r_x1": 286.365, "r_y1": 180.40099999999995, "r_x2": 286.365, "r_y2": 171.84900000000005, "r_x3": 143.153, "r_y3": 171.84900000000005, "coord_origin": "TOPLEFT"}, "text": "network (FFN). The FFN consists", "orig": "network (FFN). The FFN consists", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 21, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 192.356, "r_x1": 286.365, "r_y1": 192.356, "r_x2": 286.365, "r_y2": 183.80399999999997, "r_x3": 50.112, "r_y3": 183.80399999999997, "coord_origin": "TOPLEFT"}, "text": "of a Multi-Layer Perceptron (3 layers with ReLU activa-", "orig": "of a Multi-Layer Perceptron (3 layers with ReLU activa-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 22, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 204.31100000000004, "r_x1": 286.365, "r_y1": 204.31100000000004, "r_x2": 286.365, "r_y2": 195.75900000000001, "r_x3": 50.112, "r_y3": 195.75900000000001, "coord_origin": "TOPLEFT"}, "text": "tion function) that predicts the normalized coordinates for", "orig": "tion function) that predicts the normalized coordinates for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 23, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 216.26599999999996, "r_x1": 196.004, "r_y1": 216.26599999999996, "r_x2": 196.004, "r_y2": 207.71400000000006, "r_x3": 50.112, "r_y3": 207.71400000000006, "coord_origin": "TOPLEFT"}, "text": "the bounding box of each table cell.", "orig": "the bounding box of each table cell.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 24, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 200.786, "r_y0": 216.26599999999996, "r_x1": 286.365, "r_y1": 216.26599999999996, "r_x2": 286.365, "r_y2": 207.71400000000006, "r_x3": 200.786, "r_y3": 207.71400000000006, "coord_origin": "TOPLEFT"}, "text": "Finally, the predicted", "orig": "Finally, the predicted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 25, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 228.221, "r_x1": 286.365, "r_y1": 228.221, "r_x2": 286.365, "r_y2": 219.66899999999998, "r_x3": 50.112, "r_y3": 219.66899999999998, "coord_origin": "TOPLEFT"}, "text": "bounding boxes are classified based on whether they are", "orig": "bounding boxes are classified based on whether they are", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 26, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 240.17700000000002, "r_x1": 181.549, "r_y1": 240.17700000000002, "r_x2": 181.549, "r_y2": 231.625, "r_x3": 50.112, "r_y3": 231.625, "coord_origin": "TOPLEFT"}, "text": "empty or not using a linear layer.", "orig": "empty or not using a linear layer.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 27, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 252.87800000000004, "r_x1": 129.215, "r_y1": 252.87800000000004, "r_x2": 129.215, "r_y2": 243.92200000000003, "r_x3": 62.067, "r_y3": 243.92200000000003, "coord_origin": "TOPLEFT"}, "text": "Loss Functions.", "orig": "Loss Functions.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 28, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.451, "r_y0": 252.86199999999997, "r_x1": 276.139, "r_y1": 252.86199999999997, "r_x2": 276.139, "r_y2": 244.30999999999995, "r_x3": 134.451, "r_y3": 244.30999999999995, "coord_origin": "TOPLEFT"}, "text": "We formulate a multi-task loss Eq.", "orig": "We formulate a multi-task loss Eq.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 29, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 281.379, "r_y0": 252.86199999999997, "r_x1": 286.361, "r_y1": 252.86199999999997, "r_x2": 286.361, "r_y2": 244.30999999999995, "r_x3": 281.379, "r_y3": 244.30999999999995, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 30, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 264.817, "r_x1": 134.685, "r_y1": 264.817, "r_x2": 134.685, "r_y2": 256.265, "r_x3": 50.112, "r_y3": 256.265, "coord_origin": "TOPLEFT"}, "text": "to train our network.", "orig": "to train our network.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 140.543, "r_y0": 264.817, "r_x1": 286.365, "r_y1": 264.817, "r_x2": 286.365, "r_y2": 256.265, "r_x3": 140.543, "r_y3": 256.265, "coord_origin": "TOPLEFT"}, "text": "The Cross-Entropy loss (denoted as", "orig": "The Cross-Entropy loss (denoted as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 276.60900000000004, "r_x1": 53.085, "r_y1": 276.60900000000004, "r_x2": 53.085, "r_y2": 267.903, "r_x3": 50.112, "r_y3": 267.903, "coord_origin": "TOPLEFT"}, "text": "l", "orig": "l", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 53.085, "r_y0": 277.53200000000004, "r_x1": 56.845, "r_y1": 277.53200000000004, "r_x2": 56.845, "r_y2": 271.438, "r_x3": 53.085, "r_y3": 271.438, "coord_origin": "TOPLEFT"}, "text": "s", "orig": "s", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 57.343, "r_y0": 276.773, "r_x1": 135.4, "r_y1": 276.773, "r_x2": 135.4, "r_y2": 268.221, "r_x3": 57.343, "r_y3": 268.221, "coord_origin": "TOPLEFT"}, "text": ") is used to train the", "orig": ") is used to train the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 137.735, "r_y0": 276.63, "r_x1": 211.08, "r_y1": 276.63, "r_x2": 211.08, "r_y2": 268.04200000000003, "r_x3": 137.735, "r_y3": 268.04200000000003, "coord_origin": "TOPLEFT"}, "text": "Structure Decoder", "orig": "Structure Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 213.637, "r_y0": 276.773, "r_x1": 286.364, "r_y1": 276.773, "r_x2": 286.364, "r_y2": 268.221, "r_x3": 213.637, "r_y3": 268.221, "coord_origin": "TOPLEFT"}, "text": "which predicts the", "orig": "which predicts the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 288.728, "r_x1": 158.824, "r_y1": 288.728, "r_x2": 158.824, "r_y2": 280.176, "r_x3": 50.112, "r_y3": 280.176, "coord_origin": "TOPLEFT"}, "text": "structure tokens. As for the", "orig": "structure tokens. As for the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 161.318, "r_y0": 288.585, "r_x1": 238.797, "r_y1": 288.585, "r_x2": 238.797, "r_y2": 279.99699999999996, "r_x3": 161.318, "r_y3": 279.99699999999996, "coord_origin": "TOPLEFT"}, "text": "Cell BBox Decoder", "orig": "Cell BBox Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 241.521, "r_y0": 288.728, "r_x1": 286.363, "r_y1": 288.728, "r_x2": 286.363, "r_y2": 280.176, "r_x3": 241.521, "r_y3": 280.176, "coord_origin": "TOPLEFT"}, "text": "it is trained", "orig": "it is trained", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 300.683, "r_x1": 211.377, "r_y1": 300.683, "r_x2": 211.377, "r_y2": 292.131, "r_x3": 50.112, "r_y3": 292.131, "coord_origin": "TOPLEFT"}, "text": "with a combination of losses denoted as", "orig": "with a combination of losses denoted as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 214.271, "r_y0": 300.519, "r_x1": 217.244, "r_y1": 300.519, "r_x2": 217.244, "r_y2": 291.813, "r_x3": 214.271, "r_y3": 291.813, "coord_origin": "TOPLEFT"}, "text": "l", "orig": "l", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 217.244, "r_y0": 301.442, "r_x1": 229.198, "r_y1": 301.442, "r_x2": 229.198, "r_y2": 295.348, "r_x3": 217.244, "r_y3": 295.348, "coord_origin": "TOPLEFT"}, "text": "box", "orig": "box", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 229.696, "r_y0": 300.683, "r_x1": 232.187, "r_y1": 300.683, "r_x2": 232.187, "r_y2": 292.131, "r_x3": 229.696, "r_y3": 292.131, "coord_origin": "TOPLEFT"}, "text": ".", "orig": ".", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 236.49, "r_y0": 300.519, "r_x1": 239.463, "r_y1": 300.519, "r_x2": 239.463, "r_y2": 291.813, "r_x3": 236.49, "r_y3": 291.813, "coord_origin": "TOPLEFT"}, "text": "l", "orig": "l", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 239.463, "r_y0": 301.442, "r_x1": 251.417, "r_y1": 301.442, "r_x2": 251.417, "r_y2": 295.348, "r_x3": 239.463, "r_y3": 295.348, "coord_origin": "TOPLEFT"}, "text": "box", "orig": "box", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 254.811, "r_y0": 300.683, "r_x1": 286.363, "r_y1": 300.683, "r_x2": 286.363, "r_y2": 292.131, "r_x3": 254.811, "r_y3": 292.131, "coord_origin": "TOPLEFT"}, "text": "consists", "orig": "consists", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 312.638, "r_x1": 137.454, "r_y1": 312.638, "r_x2": 137.454, "r_y2": 304.086, "r_x3": 50.112, "r_y3": 304.086, "coord_origin": "TOPLEFT"}, "text": "of the generally used", "orig": "of the generally used", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 48, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 141.298, "r_y0": 312.474, "r_x1": 144.271, "r_y1": 312.474, "r_x2": 144.271, "r_y2": 303.768, "r_x3": 141.298, "r_y3": 303.768, "coord_origin": "TOPLEFT"}, "text": "l", "orig": "l", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 49, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 144.271, "r_y0": 313.398, "r_x1": 148.243, "r_y1": 313.398, "r_x2": 148.243, "r_y2": 307.304, "r_x3": 144.271, "r_y3": 307.304, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 50, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 152.586, "r_y0": 312.638, "r_x1": 286.364, "r_y1": 312.638, "r_x2": 286.364, "r_y2": 304.086, "r_x3": 152.586, "r_y3": 304.086, "coord_origin": "TOPLEFT"}, "text": "loss for object detection and the", "orig": "loss for object detection and the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 51, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 324.593, "r_x1": 89.683, "r_y1": 324.593, "r_x2": 89.683, "r_y2": 316.041, "r_x3": 50.112, "r_y3": 316.041, "coord_origin": "TOPLEFT"}, "text": "IoU loss (", "orig": "IoU loss (", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 52, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 89.686, "r_y0": 324.429, "r_x1": 92.659, "r_y1": 324.429, "r_x2": 92.659, "r_y2": 315.723, "r_x3": 89.686, "r_y3": 315.723, "coord_origin": "TOPLEFT"}, "text": "l", "orig": "l", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 53, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 92.659, "r_y0": 325.353, "r_x1": 104.12, "r_y1": 325.353, "r_x2": 104.12, "r_y2": 319.259, "r_x3": 92.659, "r_y3": 319.259, "coord_origin": "TOPLEFT"}, "text": "iou", "orig": "iou", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 54, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 104.618, "r_y0": 324.593, "r_x1": 286.366, "r_y1": 324.593, "r_x2": 286.366, "r_y2": 316.041, "r_x3": 104.618, "r_y3": 316.041, "coord_origin": "TOPLEFT"}, "text": ") to be scale invariant as explained in [25]. In", "orig": ") to be scale invariant as explained in [25]. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 55, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 336.549, "r_x1": 286.365, "r_y1": 336.549, "r_x2": 286.365, "r_y2": 327.997, "r_x3": 50.112, "r_y3": 327.997, "coord_origin": "TOPLEFT"}, "text": "comparison to DETR, we do not use the Hungarian algo-", "orig": "comparison to DETR, we do not use the Hungarian algo-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 56, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 348.504, "r_x1": 286.365, "r_y1": 348.504, "r_x2": 286.365, "r_y2": 339.952, "r_x3": 50.112, "r_y3": 339.952, "coord_origin": "TOPLEFT"}, "text": "rithm [15] to match the predicted bounding boxes with the", "orig": "rithm [15] to match the predicted bounding boxes with the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 57, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 360.459, "r_x1": 286.365, "r_y1": 360.459, "r_x2": 286.365, "r_y2": 351.907, "r_x3": 50.112, "r_y3": 351.907, "coord_origin": "TOPLEFT"}, "text": "ground-truth boxes, as we have already achieved a one-to-", "orig": "ground-truth boxes, as we have already achieved a one-to-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 58, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 372.414, "r_x1": 286.365, "r_y1": 372.414, "r_x2": 286.365, "r_y2": 363.862, "r_x3": 50.112, "r_y3": 363.862, "coord_origin": "TOPLEFT"}, "text": "one match through two steps: 1) Our token input sequence", "orig": "one match through two steps: 1) Our token input sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 59, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 384.369, "r_x1": 286.365, "r_y1": 384.369, "r_x2": 286.365, "r_y2": 375.817, "r_x3": 50.112, "r_y3": 375.817, "coord_origin": "TOPLEFT"}, "text": "is naturally ordered, therefore the hidden states of the table", "orig": "is naturally ordered, therefore the hidden states of the table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 60, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 396.324, "r_x1": 286.365, "r_y1": 396.324, "r_x2": 286.365, "r_y2": 387.772, "r_x3": 50.112, "r_y3": 387.772, "coord_origin": "TOPLEFT"}, "text": "data cells are also in order when they are provided as in-", "orig": "data cells are also in order when they are provided as in-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 61, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 408.28, "r_x1": 88.687, "r_y1": 408.28, "r_x2": 88.687, "r_y2": 399.728, "r_x3": 50.112, "r_y3": 399.728, "coord_origin": "TOPLEFT"}, "text": "put to the", "orig": "put to the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 62, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 91.646, "r_y0": 408.137, "r_x1": 170.052, "r_y1": 408.137, "r_x2": 170.052, "r_y2": 399.549, "r_x3": 91.646, "r_y3": 399.549, "coord_origin": "TOPLEFT"}, "text": "Cell BBox Decoder", "orig": "Cell BBox Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 63, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 170.051, "r_y0": 408.28, "r_x1": 172.542, "r_y1": 408.28, "r_x2": 172.542, "r_y2": 399.728, "r_x3": 170.051, "r_y3": 399.728, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 64, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 175.62, "r_y0": 408.28, "r_x1": 286.364, "r_y1": 408.28, "r_x2": 286.364, "r_y2": 399.728, "r_x3": 175.62, "r_y3": 399.728, "coord_origin": "TOPLEFT"}, "text": "and 2) Our bounding boxes", "orig": "and 2) Our bounding boxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 65, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 420.235, "r_x1": 181.967, "r_y1": 420.235, "r_x2": 181.967, "r_y2": 411.683, "r_x3": 50.112, "r_y3": 411.683, "coord_origin": "TOPLEFT"}, "text": "generation mechanism (see Sec.", "orig": "generation mechanism (see Sec.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 66, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 189.09, "r_y0": 420.235, "r_x1": 286.365, "r_y1": 420.235, "r_x2": 286.365, "r_y2": 411.683, "r_x3": 189.09, "r_y3": 411.683, "coord_origin": "TOPLEFT"}, "text": "3) ensures a one-to-one", "orig": "3) ensures a one-to-one", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 67, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 432.19, "r_x1": 286.365, "r_y1": 432.19, "r_x2": 286.365, "r_y2": 423.638, "r_x3": 50.112, "r_y3": 423.638, "coord_origin": "TOPLEFT"}, "text": "mapping between the cell content and its bounding box for", "orig": "mapping between the cell content and its bounding box for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 68, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 444.145, "r_x1": 158.296, "r_y1": 444.145, "r_x2": 158.296, "r_y2": 435.593, "r_x3": 50.112, "r_y3": 435.593, "coord_origin": "TOPLEFT"}, "text": "all post-processed datasets.", "orig": "all post-processed datasets.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 69, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 456.831, "r_x1": 286.365, "r_y1": 456.831, "r_x2": 286.365, "r_y2": 448.279, "r_x3": 62.067, "r_y3": 448.279, "coord_origin": "TOPLEFT"}, "text": "The loss used to train the TableFormer can be defined as", "orig": "The loss used to train the TableFormer can be defined as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 70, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 468.786, "r_x1": 91.377, "r_y1": 468.786, "r_x2": 91.377, "r_y2": 460.234, "r_x3": 50.112, "r_y3": 460.234, "coord_origin": "TOPLEFT"}, "text": "following:", "orig": "following:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 71, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 125.715, "r_y0": 502.097, "r_x1": 128.688, "r_y1": 502.097, "r_x2": 128.688, "r_y2": 493.391, "r_x3": 125.715, "r_y3": 493.391, "coord_origin": "TOPLEFT"}, "text": "l", "orig": "l", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 72, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 128.688, "r_y0": 503.02, "r_x1": 140.642, "r_y1": 503.02, "r_x2": 140.642, "r_y2": 496.926, "r_x3": 128.688, "r_y3": 496.926, "coord_origin": "TOPLEFT"}, "text": "box", "orig": "box", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 73, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 143.907, "r_y0": 502.097, "r_x1": 151.656, "r_y1": 502.097, "r_x2": 151.656, "r_y2": 493.391, "r_x3": 143.907, "r_y3": 493.391, "coord_origin": "TOPLEFT"}, "text": "=", "orig": "=", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 74, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 154.423, "r_y0": 502.097, "r_x1": 160.234, "r_y1": 502.097, "r_x2": 160.234, "r_y2": 493.391, "r_x3": 154.423, "r_y3": 493.391, "coord_origin": "TOPLEFT"}, "text": "\u03bb", "orig": "\u03bb", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 75, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.235, "r_y0": 503.02, "r_x1": 186.628, "r_y1": 503.02, "r_x2": 186.628, "r_y2": 496.926, "r_x3": 160.235, "r_y3": 496.926, "coord_origin": "TOPLEFT"}, "text": "iou iou", "orig": "iou iou", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 76, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 172.194, "r_y0": 502.097, "r_x1": 175.167, "r_y1": 502.097, "r_x2": 175.167, "r_y2": 493.391, "r_x3": 172.194, "r_y3": 493.391, "coord_origin": "TOPLEFT"}, "text": "l", "orig": "l", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 77, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 189.34, "r_y0": 502.097, "r_x1": 197.089, "r_y1": 502.097, "r_x2": 197.089, "r_y2": 493.391, "r_x3": 189.34, "r_y3": 493.391, "coord_origin": "TOPLEFT"}, "text": "+", "orig": "+", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 78, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 199.303, "r_y0": 502.097, "r_x1": 205.114, "r_y1": 502.097, "r_x2": 205.114, "r_y2": 493.391, "r_x3": 199.303, "r_y3": 493.391, "coord_origin": "TOPLEFT"}, "text": "\u03bb", "orig": "\u03bb", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 79, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 205.115, "r_y0": 503.02, "r_x1": 207.635, "r_y1": 503.02, "r_x2": 207.635, "r_y2": 496.926, "r_x3": 205.115, "r_y3": 496.926, "coord_origin": "TOPLEFT"}, "text": "l", "orig": "l", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 80, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 207.675, "r_y0": 503.02, "r_x1": 211.647, "r_y1": 503.02, "r_x2": 211.647, "r_y2": 496.926, "r_x3": 207.675, "r_y3": 496.926, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 81, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 124.33, "r_y0": 517.0409999999999, "r_x1": 127.303, "r_y1": 517.0409999999999, "r_x2": 127.303, "r_y2": 508.335, "r_x3": 124.33, "r_y3": 508.335, "coord_origin": "TOPLEFT"}, "text": "l", "orig": "l", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 82, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 130.266, "r_y0": 517.0409999999999, "r_x1": 138.015, "r_y1": 517.0409999999999, "r_x2": 138.015, "r_y2": 508.335, "r_x3": 130.266, "r_y3": 508.335, "coord_origin": "TOPLEFT"}, "text": "=", "orig": "=", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 83, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 140.782, "r_y0": 517.0409999999999, "r_x1": 149.566, "r_y1": 517.0409999999999, "r_x2": 149.566, "r_y2": 508.335, "r_x3": 140.782, "r_y3": 508.335, "coord_origin": "TOPLEFT"}, "text": "\u03bbl", "orig": "\u03bbl", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 84, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 149.566, "r_y0": 517.9639999999999, "r_x1": 153.326, "r_y1": 517.9639999999999, "r_x2": 153.326, "r_y2": 511.87, "r_x3": 149.566, "r_y3": 511.87, "coord_origin": "TOPLEFT"}, "text": "s", "orig": "s", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 85, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 156.039, "r_y0": 517.0409999999999, "r_x1": 174.855, "r_y1": 517.0409999999999, "r_x2": 174.855, "r_y2": 508.335, "r_x3": 156.039, "r_y3": 508.335, "coord_origin": "TOPLEFT"}, "text": "+(1", "orig": "+(1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 86, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 177.071, "r_y0": 516.899, "r_x1": 184.82, "r_y1": 516.899, "r_x2": 184.82, "r_y2": 508.335, "r_x3": 177.071, "r_y3": 508.335, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 87, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 187.033, "r_y0": 517.0409999999999, "r_x1": 199.692, "r_y1": 517.0409999999999, "r_x2": 199.692, "r_y2": 508.335, "r_x3": 187.033, "r_y3": 508.335, "coord_origin": "TOPLEFT"}, "text": "\u03bb l", "orig": "\u03bb l", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 88, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 192.845, "r_y0": 517.0409999999999, "r_x1": 196.719, "r_y1": 517.0409999999999, "r_x2": 196.719, "r_y2": 508.335, "r_x3": 192.845, "r_y3": 508.335, "coord_origin": "TOPLEFT"}, "text": ")", "orig": ")", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 89, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 199.692, "r_y0": 517.9639999999999, "r_x1": 211.646, "r_y1": 517.9639999999999, "r_x2": 211.646, "r_y2": 511.87, "r_x3": 199.692, "r_y3": 511.87, "coord_origin": "TOPLEFT"}, "text": "box", "orig": "box", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 90, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 274.746, "r_y0": 509.832, "r_x1": 286.362, "r_y1": 509.832, "r_x2": 286.362, "r_y2": 501.28, "r_x3": 274.746, "r_y3": 501.28, "coord_origin": "TOPLEFT"}, "text": "(1)", "orig": "(1)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 91, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 540.13, "r_x1": 74.451, "r_y1": 540.13, "r_x2": 74.451, "r_y2": 531.578, "r_x3": 50.112, "r_y3": 531.578, "coord_origin": "TOPLEFT"}, "text": "where", "orig": "where", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 92, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 76.941, "r_y0": 539.966, "r_x1": 82.752, "r_y1": 539.966, "r_x2": 82.752, "r_y2": 531.26, "r_x3": 76.941, "r_y3": 531.26, "coord_origin": "TOPLEFT"}, "text": "\u03bb", "orig": "\u03bb", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 93, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 85.52, "r_y0": 539.8240000000001, "r_x1": 92.162, "r_y1": 539.8240000000001, "r_x2": 92.162, "r_y2": 531.26, "r_x3": 85.52, "r_y3": 531.26, "coord_origin": "TOPLEFT"}, "text": "\u2208", "orig": "\u2208", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 94, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 94.653, "r_y0": 540.13, "r_x1": 135.599, "r_y1": 540.13, "r_x2": 135.599, "r_y2": 531.578, "r_x3": 94.653, "r_y3": 531.578, "coord_origin": "TOPLEFT"}, "text": "[0, 1], and", "orig": "[0, 1], and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 95, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 138.09, "r_y0": 539.966, "r_x1": 143.901, "r_y1": 539.966, "r_x2": 143.901, "r_y2": 531.26, "r_x3": 138.09, "r_y3": 531.26, "coord_origin": "TOPLEFT"}, "text": "\u03bb", "orig": "\u03bb", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 96, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 143.901, "r_y0": 540.889, "r_x1": 155.362, "r_y1": 540.889, "r_x2": 155.362, "r_y2": 534.7950000000001, "r_x3": 143.901, "r_y3": 534.7950000000001, "coord_origin": "TOPLEFT"}, "text": "iou", "orig": "iou", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 97, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 155.861, "r_y0": 539.966, "r_x1": 166.104, "r_y1": 539.966, "r_x2": 166.104, "r_y2": 531.26, "r_x3": 155.861, "r_y3": 531.26, "coord_origin": "TOPLEFT"}, "text": ", \u03bb", "orig": ", \u03bb", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 98, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 166.1, "r_y0": 540.889, "r_x1": 168.62, "r_y1": 540.889, "r_x2": 168.62, "r_y2": 534.7950000000001, "r_x3": 166.1, "r_y3": 534.7950000000001, "coord_origin": "TOPLEFT"}, "text": "l", "orig": "l", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 99, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 168.66, "r_y0": 540.889, "r_x1": 172.632, "r_y1": 540.889, "r_x2": 172.632, "r_y2": 534.7950000000001, "r_x3": 168.66, "r_y3": 534.7950000000001, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 100, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 175.897, "r_y0": 539.8240000000001, "r_x1": 182.539, "r_y1": 539.8240000000001, "r_x2": 182.539, "r_y2": 531.26, "r_x3": 175.897, "r_y3": 531.26, "coord_origin": "TOPLEFT"}, "text": "\u2208", "orig": "\u2208", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 101, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 185.306, "r_y0": 538.064, "r_x1": 192.501, "r_y1": 538.064, "r_x2": 192.501, "r_y2": 533.441, "r_x3": 185.306, "r_y3": 533.441, "coord_origin": "TOPLEFT"}, "text": "R", "orig": "R", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 102, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 194.992, "r_y0": 540.13, "r_x1": 281.597, "r_y1": 540.13, "r_x2": 281.597, "r_y2": 531.578, "r_x3": 194.992, "r_y3": 531.578, "coord_origin": "TOPLEFT"}, "text": "are hyper-parameters.", "orig": "are hyper-parameters.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 103, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 566.665, "r_x1": 171.983, "r_y1": 566.665, "r_x2": 171.983, "r_y2": 555.917, "r_x3": 50.112, "r_y3": 555.917, "coord_origin": "TOPLEFT"}, "text": "5. Experimental Results", "orig": "5. Experimental Results", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 104, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 586.116, "r_x1": 179.175, "r_y1": 586.116, "r_x2": 179.175, "r_y2": 576.264, "r_x3": 50.112, "r_y3": 576.264, "coord_origin": "TOPLEFT"}, "text": "5.1. Implementation Details", "orig": "5.1. Implementation Details", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 105, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 604.5550000000001, "r_x1": 202.978, "r_y1": 604.5550000000001, "r_x2": 202.978, "r_y2": 596.0029999999999, "r_x3": 62.067, "r_y3": 596.0029999999999, "coord_origin": "TOPLEFT"}, "text": "TableFormer uses ResNet-18 as the", "orig": "TableFormer uses ResNet-18 as the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 106, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 205.384, "r_y0": 604.412, "r_x1": 286.36, "r_y1": 604.412, "r_x2": 286.36, "r_y2": 595.8240000000001, "r_x3": 205.384, "r_y3": 595.8240000000001, "coord_origin": "TOPLEFT"}, "text": "CNN Backbone Net-", "orig": "CNN Backbone Net-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 107, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 616.367, "r_x1": 70.037, "r_y1": 616.367, "r_x2": 70.037, "r_y2": 607.779, "r_x3": 50.112, "r_y3": 607.779, "coord_origin": "TOPLEFT"}, "text": "work", "orig": "work", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 108, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.037, "r_y0": 616.51, "r_x1": 72.528, "r_y1": 616.51, "r_x2": 72.528, "r_y2": 607.958, "r_x3": 70.037, "r_y3": 607.958, "coord_origin": "TOPLEFT"}, "text": ".", "orig": ".", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 109, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 77.14, "r_y0": 616.51, "r_x1": 286.365, "r_y1": 616.51, "r_x2": 286.365, "r_y2": 607.958, "r_x3": 77.14, "r_y3": 607.958, "coord_origin": "TOPLEFT"}, "text": "The input images are resized to 448*448 pixels and", "orig": "The input images are resized to 448*448 pixels and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 110, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 628.465, "r_x1": 286.365, "r_y1": 628.465, "r_x2": 286.365, "r_y2": 619.913, "r_x3": 50.112, "r_y3": 619.913, "coord_origin": "TOPLEFT"}, "text": "the feature map has a dimension of 28*28. Additionally, we", "orig": "the feature map has a dimension of 28*28. Additionally, we", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 111, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 640.421, "r_x1": 207.033, "r_y1": 640.421, "r_x2": 207.033, "r_y2": 631.869, "r_x3": 50.112, "r_y3": 631.869, "coord_origin": "TOPLEFT"}, "text": "enforce the following input constraints:", "orig": "enforce the following input constraints:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 112, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 91.661, "r_y0": 663.366, "r_x1": 186.017, "r_y1": 663.366, "r_x2": 186.017, "r_y2": 654.814, "r_x3": 91.661, "r_y3": 654.814, "coord_origin": "TOPLEFT"}, "text": "Image width and height", "orig": "Image width and height", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 113, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 188.507, "r_y0": 663.06, "r_x1": 196.256, "r_y1": 663.06, "r_x2": 196.256, "r_y2": 654.496, "r_x3": 188.507, "r_y3": 654.496, "coord_origin": "TOPLEFT"}, "text": "\u2264", "orig": "\u2264", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 114, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 198.746, "r_y0": 663.366, "r_x1": 244.813, "r_y1": 663.366, "r_x2": 244.813, "r_y2": 654.814, "r_x3": 198.746, "r_y3": 654.814, "coord_origin": "TOPLEFT"}, "text": "1024 pixels", "orig": "1024 pixels", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 115, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 101.016, "r_y0": 678.31, "r_x1": 186.246, "r_y1": 678.31, "r_x2": 186.246, "r_y2": 669.758, "r_x3": 101.016, "r_y3": 669.758, "coord_origin": "TOPLEFT"}, "text": "Structural tags length", "orig": "Structural tags length", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 116, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 188.736, "r_y0": 678.004, "r_x1": 196.485, "r_y1": 678.004, "r_x2": 196.485, "r_y2": 669.44, "r_x3": 188.736, "r_y3": 669.44, "coord_origin": "TOPLEFT"}, "text": "\u2264", "orig": "\u2264", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 117, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 198.975, "r_y0": 678.31, "r_x1": 244.813, "r_y1": 678.31, "r_x2": 244.813, "r_y2": 669.758, "r_x3": 198.975, "r_y3": 669.758, "coord_origin": "TOPLEFT"}, "text": "512 tokens.", "orig": "512 tokens.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 118, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 274.746, "r_y0": 670.938, "r_x1": 286.362, "r_y1": 670.938, "r_x2": 286.362, "r_y2": 662.386, "r_x3": 274.746, "r_y3": 662.386, "coord_origin": "TOPLEFT"}, "text": "(2)", "orig": "(2)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 119, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 701.111, "r_x1": 286.365, "r_y1": 701.111, "r_x2": 286.365, "r_y2": 692.559, "r_x3": 50.112, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "Although input constraints are used also by other methods,", "orig": "Although input constraints are used also by other methods,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 120, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 713.066, "r_x1": 286.365, "r_y1": 713.066, "r_x2": 286.365, "r_y2": 704.514, "r_x3": 50.112, "r_y3": 704.514, "coord_origin": "TOPLEFT"}, "text": "such as EDD, ours are less restrictive due to the improved", "orig": "such as EDD, ours are less restrictive due to the improved", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 121, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 84.029, "r_x1": 545.115, "r_y1": 84.029, "r_x2": 545.115, "r_y2": 75.47699999999998, "r_x3": 308.862, "r_y3": 75.47699999999998, "coord_origin": "TOPLEFT"}, "text": "runtime performance and lower memory footprint of Table-", "orig": "runtime performance and lower memory footprint of Table-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 122, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 95.98400000000004, "r_x1": 339.985, "r_y1": 95.98400000000004, "r_x2": 339.985, "r_y2": 87.43200000000002, "r_x3": 308.862, "r_y3": 87.43200000000002, "coord_origin": "TOPLEFT"}, "text": "Former.", "orig": "Former.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 123, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 346.889, "r_y0": 95.98400000000004, "r_x1": 545.115, "r_y1": 95.98400000000004, "r_x2": 545.115, "r_y2": 87.43200000000002, "r_x3": 346.889, "r_y3": 87.43200000000002, "coord_origin": "TOPLEFT"}, "text": "This allows to utilize input samples with longer", "orig": "This allows to utilize input samples with longer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 124, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 107.93899999999996, "r_x1": 492.961, "r_y1": 107.93899999999996, "r_x2": 492.961, "r_y2": 99.38699999999994, "r_x3": 308.862, "r_y3": 99.38699999999994, "coord_origin": "TOPLEFT"}, "text": "sequences and images with larger dimensions.", "orig": "sequences and images with larger dimensions.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 125, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 125.04999999999995, "r_x1": 545.115, "r_y1": 125.04999999999995, "r_x2": 545.115, "r_y2": 116.49800000000005, "r_x3": 320.817, "r_y3": 116.49800000000005, "coord_origin": "TOPLEFT"}, "text": "The Transformer Encoder consists of two 'Transformer", "orig": "The Transformer Encoder consists of two 'Transformer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 126, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 137.005, "r_x1": 545.115, "r_y1": 137.005, "r_x2": 545.115, "r_y2": 128.45299999999997, "r_x3": 308.862, "r_y3": 128.45299999999997, "coord_origin": "TOPLEFT"}, "text": "Encoder Layers', with an input feature size of 512, feed", "orig": "Encoder Layers', with an input feature size of 512, feed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 127, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 148.96000000000004, "r_x1": 545.115, "r_y1": 148.96000000000004, "r_x2": 545.115, "r_y2": 140.40800000000002, "r_x3": 308.862, "r_y3": 140.40800000000002, "coord_origin": "TOPLEFT"}, "text": "forward network of 1024, and 4 attention heads. As for the", "orig": "forward network of 1024, and 4 attention heads. As for the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 128, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 160.91499999999996, "r_x1": 545.115, "r_y1": 160.91499999999996, "r_x2": 545.115, "r_y2": 152.36300000000006, "r_x3": 308.862, "r_y3": 152.36300000000006, "coord_origin": "TOPLEFT"}, "text": "Transformer Decoder it is composed of four 'Transformer", "orig": "Transformer Decoder it is composed of four 'Transformer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 129, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 172.87, "r_x1": 545.115, "r_y1": 172.87, "r_x2": 545.115, "r_y2": 164.31799999999998, "r_x3": 308.862, "r_y3": 164.31799999999998, "coord_origin": "TOPLEFT"}, "text": "Decoder Layers' with similar input and output dimensions", "orig": "Decoder Layers' with similar input and output dimensions", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 130, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 184.82600000000002, "r_x1": 317.161, "r_y1": 184.82600000000002, "r_x2": 317.161, "r_y2": 176.274, "r_x3": 308.862, "r_y3": 176.274, "coord_origin": "TOPLEFT"}, "text": "as", "orig": "as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 131, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 321.365, "r_y0": 184.82600000000002, "r_x1": 333.539, "r_y1": 184.82600000000002, "r_x2": 333.539, "r_y2": 176.274, "r_x3": 321.365, "r_y3": 176.274, "coord_origin": "TOPLEFT"}, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 132, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 337.734, "r_y0": 184.82600000000002, "r_x1": 467.218, "r_y1": 184.82600000000002, "r_x2": 467.218, "r_y2": 176.274, "r_x3": 337.734, "r_y3": 176.274, "coord_origin": "TOPLEFT"}, "text": "'Transformer Encoder Layers'.", "orig": "'Transformer Encoder Layers'.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 133, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 475.437, "r_y0": 184.82600000000002, "r_x1": 545.115, "r_y1": 184.82600000000002, "r_x2": 545.115, "r_y2": 176.274, "r_x3": 475.437, "r_y3": 176.274, "coord_origin": "TOPLEFT"}, "text": "Even though our", "orig": "Even though our", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 134, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 196.78099999999995, "r_x1": 545.115, "r_y1": 196.78099999999995, "r_x2": 545.115, "r_y2": 188.22900000000004, "r_x3": 308.862, "r_y3": 188.22900000000004, "coord_origin": "TOPLEFT"}, "text": "model uses fewer layers and heads than the default imple-", "orig": "model uses fewer layers and heads than the default imple-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 135, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 208.736, "r_x1": 399.213, "r_y1": 208.736, "r_x2": 399.213, "r_y2": 200.18399999999997, "r_x3": 308.862, "r_y3": 200.18399999999997, "coord_origin": "TOPLEFT"}, "text": "mentation parameters,", "orig": "mentation parameters,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 136, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 403.965, "r_y0": 208.736, "r_x1": 458.63, "r_y1": 208.736, "r_x2": 458.63, "r_y2": 200.18399999999997, "r_x3": 403.965, "r_y3": 200.18399999999997, "coord_origin": "TOPLEFT"}, "text": "our extensive", "orig": "our extensive", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 137, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 462.934, "r_y0": 208.736, "r_x1": 545.115, "r_y1": 208.736, "r_x2": 545.115, "r_y2": 200.18399999999997, "r_x3": 462.934, "r_y3": 200.18399999999997, "coord_origin": "TOPLEFT"}, "text": "experimentation has", "orig": "experimentation has", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 138, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 220.69100000000003, "r_x1": 527.84, "r_y1": 220.69100000000003, "r_x2": 527.84, "r_y2": 212.139, "r_x3": 308.862, "r_y3": 212.139, "coord_origin": "TOPLEFT"}, "text": "proved this setup to be more suitable for table images.", "orig": "proved this setup to be more suitable for table images.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 139, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 532.084, "r_y0": 220.69100000000003, "r_x1": 545.115, "r_y1": 220.69100000000003, "r_x2": 545.115, "r_y2": 212.139, "r_x3": 532.084, "r_y3": 212.139, "coord_origin": "TOPLEFT"}, "text": "We", "orig": "We", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 140, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 232.64599999999996, "r_x1": 341.868, "r_y1": 232.64599999999996, "r_x2": 341.868, "r_y2": 224.09400000000005, "r_x3": 308.862, "r_y3": 224.09400000000005, "coord_origin": "TOPLEFT"}, "text": "attribute", "orig": "attribute", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 141, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 346.371, "r_y0": 232.64599999999996, "r_x1": 360.767, "r_y1": 232.64599999999996, "r_x2": 360.767, "r_y2": 224.09400000000005, "r_x3": 346.371, "r_y3": 224.09400000000005, "coord_origin": "TOPLEFT"}, "text": "this", "orig": "this", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 142, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 365.27, "r_y0": 232.64599999999996, "r_x1": 393.504, "r_y1": 232.64599999999996, "r_x2": 393.504, "r_y2": 224.09400000000005, "r_x3": 365.27, "r_y3": 224.09400000000005, "coord_origin": "TOPLEFT"}, "text": "finding", "orig": "finding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 143, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 398.007, "r_y0": 232.64599999999996, "r_x1": 405.758, "r_y1": 232.64599999999996, "r_x2": 405.758, "r_y2": 224.09400000000005, "r_x3": 398.007, "r_y3": 224.09400000000005, "coord_origin": "TOPLEFT"}, "text": "to", "orig": "to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 144, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 410.261, "r_y0": 232.64599999999996, "r_x1": 422.436, "r_y1": 232.64599999999996, "r_x2": 422.436, "r_y2": 224.09400000000005, "r_x3": 410.261, "r_y3": 224.09400000000005, "coord_origin": "TOPLEFT"}, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 145, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 426.939, "r_y0": 232.64599999999996, "r_x1": 459.586, "r_y1": 232.64599999999996, "r_x2": 459.586, "r_y2": 224.09400000000005, "r_x3": 426.939, "r_y3": 224.09400000000005, "coord_origin": "TOPLEFT"}, "text": "inherent", "orig": "inherent", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 146, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 464.089, "r_y0": 232.64599999999996, "r_x1": 490.102, "r_y1": 232.64599999999996, "r_x2": 490.102, "r_y2": 224.09400000000005, "r_x3": 464.089, "r_y3": 224.09400000000005, "coord_origin": "TOPLEFT"}, "text": "design", "orig": "design", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 147, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 494.605, "r_y0": 232.64599999999996, "r_x1": 502.904, "r_y1": 232.64599999999996, "r_x2": 502.904, "r_y2": 224.09400000000005, "r_x3": 494.605, "r_y3": 224.09400000000005, "coord_origin": "TOPLEFT"}, "text": "of", "orig": "of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 148, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 507.407, "r_y0": 232.64599999999996, "r_x1": 526.774, "r_y1": 232.64599999999996, "r_x2": 526.774, "r_y2": 224.09400000000005, "r_x3": 507.407, "r_y3": 224.09400000000005, "coord_origin": "TOPLEFT"}, "text": "table", "orig": "table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 149, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 531.277, "r_y0": 232.64599999999996, "r_x1": 545.115, "r_y1": 232.64599999999996, "r_x2": 545.115, "r_y2": 224.09400000000005, "r_x3": 531.277, "r_y3": 224.09400000000005, "coord_origin": "TOPLEFT"}, "text": "im-", "orig": "im-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 150, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 244.601, "r_x1": 545.115, "r_y1": 244.601, "r_x2": 545.115, "r_y2": 236.04899999999998, "r_x3": 308.862, "r_y3": 236.04899999999998, "coord_origin": "TOPLEFT"}, "text": "ages, which contain mostly lines and text, unlike the more", "orig": "ages, which contain mostly lines and text, unlike the more", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 151, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 256.557, "r_x1": 496.169, "r_y1": 256.557, "r_x2": 496.169, "r_y2": 248.005, "r_x3": 308.862, "r_y3": 248.005, "coord_origin": "TOPLEFT"}, "text": "elaborate content present in other scopes (e.g.", "orig": "elaborate content present in other scopes (e.g.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 152, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 501.897, "r_y0": 256.557, "r_x1": 545.115, "r_y1": 256.557, "r_x2": 545.115, "r_y2": 248.005, "r_x3": 501.897, "r_y3": 248.005, "coord_origin": "TOPLEFT"}, "text": "the COCO", "orig": "the COCO", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 153, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 268.51199999999994, "r_x1": 342.336, "r_y1": 268.51199999999994, "r_x2": 342.336, "r_y2": 259.96000000000004, "r_x3": 308.862, "r_y3": 259.96000000000004, "coord_origin": "TOPLEFT"}, "text": "dataset).", "orig": "dataset).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 154, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 348.952, "r_y0": 268.51199999999994, "r_x1": 545.115, "r_y1": 268.51199999999994, "r_x2": 545.115, "r_y2": 259.96000000000004, "r_x3": 348.952, "r_y3": 259.96000000000004, "coord_origin": "TOPLEFT"}, "text": "Moreover, we have added ResNet blocks to the", "orig": "Moreover, we have added ResNet blocks to the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 155, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 280.467, "r_x1": 545.115, "r_y1": 280.467, "r_x2": 545.115, "r_y2": 271.91499999999996, "r_x3": 308.862, "r_y3": 271.91499999999996, "coord_origin": "TOPLEFT"}, "text": "inputs of the Structure Decoder and Cell BBox Decoder.", "orig": "inputs of the Structure Decoder and Cell BBox Decoder.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 156, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 292.422, "r_x1": 545.115, "r_y1": 292.422, "r_x2": 545.115, "r_y2": 283.87, "r_x3": 308.862, "r_y3": 283.87, "coord_origin": "TOPLEFT"}, "text": "This prevents a decoder having a stronger influence over the", "orig": "This prevents a decoder having a stronger influence over the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 157, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 304.377, "r_x1": 545.115, "r_y1": 304.377, "r_x2": 545.115, "r_y2": 295.825, "r_x3": 308.862, "r_y3": 295.825, "coord_origin": "TOPLEFT"}, "text": "learned weights which would damage the other prediction", "orig": "learned weights which would damage the other prediction", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 158, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 316.332, "r_x1": 545.115, "r_y1": 316.332, "r_x2": 545.115, "r_y2": 307.78, "r_x3": 308.862, "r_y3": 307.78, "coord_origin": "TOPLEFT"}, "text": "task (structure vs bounding boxes), but learn task specific", "orig": "task (structure vs bounding boxes), but learn task specific", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 159, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 328.288, "r_x1": 532.483, "r_y1": 328.288, "r_x2": 532.483, "r_y2": 319.736, "r_x3": 308.862, "r_y3": 319.736, "coord_origin": "TOPLEFT"}, "text": "weights instead. Lastly our dropout layers are set to 0.5.", "orig": "weights instead. Lastly our dropout layers are set to 0.5.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 160, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 345.398, "r_x1": 545.115, "r_y1": 345.398, "r_x2": 545.115, "r_y2": 336.846, "r_x3": 320.817, "r_y3": 336.846, "coord_origin": "TOPLEFT"}, "text": "For training, TableFormer is trained with 3 Adam opti-", "orig": "For training, TableFormer is trained with 3 Adam opti-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 161, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 357.353, "r_x1": 403.736, "r_y1": 357.353, "r_x2": 403.736, "r_y2": 348.801, "r_x3": 308.862, "r_y3": 348.801, "coord_origin": "TOPLEFT"}, "text": "mizers, each one for the", "orig": "mizers, each one for the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 162, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 406.076, "r_y0": 357.21, "r_x1": 545.112, "r_y1": 357.21, "r_x2": 545.112, "r_y2": 348.622, "r_x3": 406.076, "r_y3": 348.622, "coord_origin": "TOPLEFT"}, "text": "CNN Backbone Network Structure", "orig": "CNN Backbone Network Structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 163, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 503.539, "r_y0": 357.353, "r_x1": 506.03, "r_y1": 357.353, "r_x2": 506.03, "r_y2": 348.801, "r_x3": 503.539, "r_y3": 348.801, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 164, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 369.165, "r_x1": 343.163, "r_y1": 369.165, "r_x2": 343.163, "r_y2": 360.577, "r_x3": 308.862, "r_y3": 360.577, "coord_origin": "TOPLEFT"}, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 165, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 343.163, "r_y0": 369.308, "r_x1": 362.202, "r_y1": 369.308, "r_x2": 362.202, "r_y2": 360.756, "r_x3": 343.163, "r_y3": 360.756, "coord_origin": "TOPLEFT"}, "text": ", and", "orig": ", and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 166, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 364.286, "r_y0": 369.165, "r_x1": 440.938, "r_y1": 369.165, "r_x2": 440.938, "r_y2": 360.577, "r_x3": 364.286, "r_y3": 360.577, "coord_origin": "TOPLEFT"}, "text": "Cell BBox Decoder", "orig": "Cell BBox Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 167, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 440.939, "r_y0": 369.308, "r_x1": 443.43, "r_y1": 369.308, "r_x2": 443.43, "r_y2": 360.756, "r_x3": 440.939, "r_y3": 360.756, "coord_origin": "TOPLEFT"}, "text": ".", "orig": ".", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 168, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 446.379, "r_y0": 369.308, "r_x1": 545.108, "r_y1": 369.308, "r_x2": 545.108, "r_y2": 360.756, "r_x3": 446.379, "r_y3": 360.756, "coord_origin": "TOPLEFT"}, "text": "Taking the PubTabNet as", "orig": "Taking the PubTabNet as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 169, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 381.263, "r_x1": 545.115, "r_y1": 381.263, "r_x2": 545.115, "r_y2": 372.711, "r_x3": 308.862, "r_y3": 372.711, "coord_origin": "TOPLEFT"}, "text": "an example for our parameter set up, the initializing learn-", "orig": "an example for our parameter set up, the initializing learn-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 170, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 393.219, "r_x1": 545.115, "r_y1": 393.219, "r_x2": 545.115, "r_y2": 384.667, "r_x3": 308.862, "r_y3": 384.667, "coord_origin": "TOPLEFT"}, "text": "ing rate is 0.001 for 12 epochs with a batch size of 24, and", "orig": "ing rate is 0.001 for 12 epochs with a batch size of 24, and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 171, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 405.01, "r_x1": 314.673, "r_y1": 405.01, "r_x2": 314.673, "r_y2": 396.304, "r_x3": 308.862, "r_y3": 396.304, "coord_origin": "TOPLEFT"}, "text": "\u03bb", "orig": "\u03bb", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 172, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 318.658, "r_y0": 405.174, "r_x1": 329.726, "r_y1": 405.174, "r_x2": 329.726, "r_y2": 396.622, "r_x3": 318.658, "r_y3": 396.622, "coord_origin": "TOPLEFT"}, "text": "set", "orig": "set", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 173, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 333.711, "r_y0": 405.174, "r_x1": 341.462, "r_y1": 405.174, "r_x2": 341.462, "r_y2": 396.622, "r_x3": 333.711, "r_y3": 396.622, "coord_origin": "TOPLEFT"}, "text": "to", "orig": "to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 174, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 345.447, "r_y0": 405.174, "r_x1": 360.391, "r_y1": 405.174, "r_x2": 360.391, "r_y2": 396.622, "r_x3": 345.447, "r_y3": 396.622, "coord_origin": "TOPLEFT"}, "text": "0.5.", "orig": "0.5.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 175, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 367.963, "r_y0": 405.174, "r_x1": 415.166, "r_y1": 405.174, "r_x2": 415.166, "r_y2": 396.622, "r_x3": 367.963, "r_y3": 396.622, "coord_origin": "TOPLEFT"}, "text": "Afterwards,", "orig": "Afterwards,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 176, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 419.519, "r_y0": 405.174, "r_x1": 545.108, "r_y1": 405.174, "r_x2": 545.108, "r_y2": 396.622, "r_x3": 419.519, "r_y3": 396.622, "coord_origin": "TOPLEFT"}, "text": "we reduce the learning rate to", "orig": "we reduce the learning rate to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 177, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 417.129, "r_x1": 545.115, "r_y1": 417.129, "r_x2": 545.115, "r_y2": 408.577, "r_x3": 308.862, "r_y3": 408.577, "coord_origin": "TOPLEFT"}, "text": "0.0001, the batch size to 18 and train for 12 more epochs or", "orig": "0.0001, the batch size to 18 and train for 12 more epochs or", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 178, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 429.084, "r_x1": 360.966, "r_y1": 429.084, "r_x2": 360.966, "r_y2": 420.532, "r_x3": 308.862, "r_y3": 420.532, "coord_origin": "TOPLEFT"}, "text": "convergence.", "orig": "convergence.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 179, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 446.195, "r_x1": 545.115, "r_y1": 446.195, "r_x2": 545.115, "r_y2": 437.643, "r_x3": 320.817, "r_y3": 437.643, "coord_origin": "TOPLEFT"}, "text": "TableFormer is implemented with PyTorch and Torchvi-", "orig": "TableFormer is implemented with PyTorch and Torchvi-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 180, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 458.15, "r_x1": 384.628, "r_y1": 458.15, "r_x2": 384.628, "r_y2": 449.598, "r_x3": 308.862, "r_y3": 449.598, "coord_origin": "TOPLEFT"}, "text": "sion libraries [22].", "orig": "sion libraries [22].", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 181, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 391.372, "r_y0": 458.15, "r_x1": 545.115, "r_y1": 458.15, "r_x2": 545.115, "r_y2": 449.598, "r_x3": 391.372, "r_y3": 449.598, "coord_origin": "TOPLEFT"}, "text": "To speed up the inference, the image", "orig": "To speed up the inference, the image", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 182, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 470.105, "r_x1": 494.007, "r_y1": 470.105, "r_x2": 494.007, "r_y2": 461.553, "r_x3": 308.862, "r_y3": 461.553, "coord_origin": "TOPLEFT"}, "text": "undergoes a single forward pass through the", "orig": "undergoes a single forward pass through the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 183, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 498.078, "r_y0": 469.962, "r_x1": 545.111, "r_y1": 469.962, "r_x2": 545.111, "r_y2": 461.374, "r_x3": 498.078, "r_y3": 461.374, "coord_origin": "TOPLEFT"}, "text": "CNN Back-", "orig": "CNN Back-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 184, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 481.917, "r_x1": 364.443, "r_y1": 481.917, "r_x2": 364.443, "r_y2": 473.329, "r_x3": 308.862, "r_y3": 473.329, "coord_origin": "TOPLEFT"}, "text": "bone Network", "orig": "bone Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 185, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 367.061, "r_y0": 482.06, "r_x1": 545.113, "r_y1": 482.06, "r_x2": 545.113, "r_y2": 473.508, "r_x3": 367.061, "r_y3": 473.508, "coord_origin": "TOPLEFT"}, "text": "and transformer encoder. This eliminates the", "orig": "and transformer encoder. This eliminates the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 186, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 494.015, "r_x1": 545.115, "r_y1": 494.015, "r_x2": 545.115, "r_y2": 485.463, "r_x3": 308.862, "r_y3": 485.463, "coord_origin": "TOPLEFT"}, "text": "overhead of generating the same features for each decoding", "orig": "overhead of generating the same features for each decoding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 187, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 505.97, "r_x1": 545.115, "r_y1": 505.97, "r_x2": 545.115, "r_y2": 497.418, "r_x3": 308.862, "r_y3": 497.418, "coord_origin": "TOPLEFT"}, "text": "step. Similarly, we employ a 'caching' technique to preform", "orig": "step. Similarly, we employ a 'caching' technique to preform", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 188, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 517.9259999999999, "r_x1": 432.588, "r_y1": 517.9259999999999, "r_x2": 432.588, "r_y2": 509.374, "r_x3": 308.862, "r_y3": 509.374, "coord_origin": "TOPLEFT"}, "text": "faster autoregressive decoding.", "orig": "faster autoregressive decoding.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 189, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 436.732, "r_y0": 517.9259999999999, "r_x1": 545.115, "r_y1": 517.9259999999999, "r_x2": 545.115, "r_y2": 509.374, "r_x3": 436.732, "r_y3": 509.374, "coord_origin": "TOPLEFT"}, "text": "This is achieved by storing", "orig": "This is achieved by storing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 190, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 529.881, "r_x1": 545.115, "r_y1": 529.881, "r_x2": 545.115, "r_y2": 521.329, "r_x3": 308.862, "r_y3": 521.329, "coord_origin": "TOPLEFT"}, "text": "the features of decoded tokens so we can reuse them for", "orig": "the features of decoded tokens so we can reuse them for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 191, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 541.836, "r_x1": 370.062, "r_y1": 541.836, "r_x2": 370.062, "r_y2": 533.284, "r_x3": 308.862, "r_y3": 533.284, "coord_origin": "TOPLEFT"}, "text": "each time step.", "orig": "each time step.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 192, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 375.721, "r_y0": 541.836, "r_x1": 545.115, "r_y1": 541.836, "r_x2": 545.115, "r_y2": 533.284, "r_x3": 375.721, "r_y3": 533.284, "coord_origin": "TOPLEFT"}, "text": "Therefore, we only compute the attention", "orig": "Therefore, we only compute the attention", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 193, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 553.7909999999999, "r_x1": 377.215, "r_y1": 553.7909999999999, "r_x2": 377.215, "r_y2": 545.239, "r_x3": 308.862, "r_y3": 545.239, "coord_origin": "TOPLEFT"}, "text": "for each new tag.", "orig": "for each new tag.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 194, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 589.406, "r_x1": 397.443, "r_y1": 589.406, "r_x2": 397.443, "r_y2": 579.554, "r_x3": 308.862, "r_y3": 579.554, "coord_origin": "TOPLEFT"}, "text": "5.2. Generalization", "orig": "5.2. Generalization", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 195, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 612.27, "r_x1": 545.115, "r_y1": 612.27, "r_x2": 545.115, "r_y2": 603.718, "r_x3": 320.817, "r_y3": 603.718, "coord_origin": "TOPLEFT"}, "text": "TableFormer is evaluated on three major publicly avail-", "orig": "TableFormer is evaluated on three major publicly avail-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 196, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 624.225, "r_x1": 545.115, "r_y1": 624.225, "r_x2": 545.115, "r_y2": 615.673, "r_x3": 308.862, "r_y3": 615.673, "coord_origin": "TOPLEFT"}, "text": "able datasets of different nature to prove the generalization", "orig": "able datasets of different nature to prove the generalization", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 197, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 636.1800000000001, "r_x1": 545.115, "r_y1": 636.1800000000001, "r_x2": 545.115, "r_y2": 627.6279999999999, "r_x3": 308.862, "r_y3": 627.6279999999999, "coord_origin": "TOPLEFT"}, "text": "and effectiveness of our model. The datasets used for eval-", "orig": "and effectiveness of our model. The datasets used for eval-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 198, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 648.135, "r_x1": 545.115, "r_y1": 648.135, "r_x2": 545.115, "r_y2": 639.583, "r_x3": 308.862, "r_y3": 639.583, "coord_origin": "TOPLEFT"}, "text": "uation are the PubTabNet, FinTabNet and TableBank which", "orig": "uation are the PubTabNet, FinTabNet and TableBank which", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 199, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 660.091, "r_x1": 545.115, "r_y1": 660.091, "r_x2": 545.115, "r_y2": 651.539, "r_x3": 308.862, "r_y3": 651.539, "coord_origin": "TOPLEFT"}, "text": "stem from the scientific, financial and general domains re-", "orig": "stem from the scientific, financial and general domains re-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 200, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 672.046, "r_x1": 350.705, "r_y1": 672.046, "r_x2": 350.705, "r_y2": 663.494, "r_x3": 308.862, "r_y3": 663.494, "coord_origin": "TOPLEFT"}, "text": "spectively.", "orig": "spectively.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 201, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 689.156, "r_x1": 545.115, "r_y1": 689.156, "r_x2": 545.115, "r_y2": 680.604, "r_x3": 320.817, "r_y3": 680.604, "coord_origin": "TOPLEFT"}, "text": "We also share our baseline results on the challenging", "orig": "We also share our baseline results on the challenging", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 202, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 701.111, "r_x1": 361.196, "r_y1": 701.111, "r_x2": 361.196, "r_y2": 692.559, "r_x3": 308.862, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "SynthTabNet", "orig": "SynthTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 203, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 366.057, "r_y0": 701.111, "r_x1": 396.214, "r_y1": 701.111, "r_x2": 396.214, "r_y2": 692.559, "r_x3": 366.057, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "dataset.", "orig": "dataset.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 204, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 406.406, "r_y0": 701.111, "r_x1": 453.449, "r_y1": 701.111, "r_x2": 453.449, "r_y2": 692.559, "r_x3": 406.406, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "Throughout", "orig": "Throughout", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 205, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 458.311, "r_y0": 701.111, "r_x1": 471.591, "r_y1": 701.111, "r_x2": 471.591, "r_y2": 692.559, "r_x3": 458.311, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "our", "orig": "our", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 206, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 476.453, "r_y0": 701.111, "r_x1": 527.481, "r_y1": 701.111, "r_x2": 527.481, "r_y2": 692.559, "r_x3": 476.453, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "experiments,", "orig": "experiments,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 207, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 532.941, "r_y0": 701.111, "r_x1": 545.115, "r_y1": 701.111, "r_x2": 545.115, "r_y2": 692.559, "r_x3": 532.941, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 208, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 713.067, "r_x1": 495.94, "r_y1": 713.067, "r_x2": 495.94, "r_y2": 704.515, "r_x3": 308.862, "r_y3": 704.515, "coord_origin": "TOPLEFT"}, "text": "same parameters stated in Sec. 5.1 are utilized.", "orig": "same parameters stated in Sec. 5.1 are utilized.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 209, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 295.121, "r_y0": 742.954, "r_x1": 300.102, "r_y1": 742.954, "r_x2": 300.102, "r_y2": 734.402, "r_x3": 295.121, "r_y3": 734.402, "coord_origin": "TOPLEFT"}, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "parsed_page": null, "predictions": {"layout": {"clusters": [{"id": 5, "label": "text", "bbox": {"l": 50.112, "t": 75.47699999999998, "r": 286.365, "b": 155.76, "coord_origin": "TOPLEFT"}, "confidence": 0.9868090152740479, "cells": [{"index": 0, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 84.029, "r_x1": 286.365, "r_y1": 84.029, "r_x2": 286.365, "r_y2": 75.47699999999998, "r_x3": 50.112, "r_y3": 75.47699999999998, "coord_origin": "TOPLEFT"}, "text": "tention encoding is then multiplied to the encoded image to", "orig": "tention encoding is then multiplied to the encoded image to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 95.98400000000004, "r_x1": 286.365, "r_y1": 95.98400000000004, "r_x2": 286.365, "r_y2": 87.43200000000002, "r_x3": 50.112, "r_y3": 87.43200000000002, "coord_origin": "TOPLEFT"}, "text": "produce a feature for each table cell. Notice that this is dif-", "orig": "produce a feature for each table cell. Notice that this is dif-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 107.93899999999996, "r_x1": 286.365, "r_y1": 107.93899999999996, "r_x2": 286.365, "r_y2": 99.38699999999994, "r_x3": 50.112, "r_y3": 99.38699999999994, "coord_origin": "TOPLEFT"}, "text": "ferent than the typical object detection problem where im-", "orig": "ferent than the typical object detection problem where im-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 119.894, "r_x1": 286.365, "r_y1": 119.894, "r_x2": 286.365, "r_y2": 111.34199999999998, "r_x3": 50.112, "r_y3": 111.34199999999998, "coord_origin": "TOPLEFT"}, "text": "balances between the number of detections and the amount", "orig": "balances between the number of detections and the amount", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 131.84900000000005, "r_x1": 135.691, "r_y1": 131.84900000000005, "r_x2": 135.691, "r_y2": 123.29700000000003, "r_x3": 50.112, "r_y3": 123.29700000000003, "coord_origin": "TOPLEFT"}, "text": "of objects may exist.", "orig": "of objects may exist.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 142.047, "r_y0": 131.84900000000005, "r_x1": 286.365, "r_y1": 131.84900000000005, "r_x2": 286.365, "r_y2": 123.29700000000003, "r_x3": 142.047, "r_y3": 123.29700000000003, "coord_origin": "TOPLEFT"}, "text": "In our case, we know up front that", "orig": "In our case, we know up front that", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 143.80499999999995, "r_x1": 286.365, "r_y1": 143.80499999999995, "r_x2": 286.365, "r_y2": 135.25300000000004, "r_x3": 50.112, "r_y3": 135.25300000000004, "coord_origin": "TOPLEFT"}, "text": "the produced detections always match with the table cells", "orig": "the produced detections always match with the table cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 155.76, "r_x1": 175.163, "r_y1": 155.76, "r_x2": 175.163, "r_y2": 147.20799999999997, "r_x3": 50.112, "r_y3": 147.20799999999997, "coord_origin": "TOPLEFT"}, "text": "in number and correspondence.", "orig": "in number and correspondence.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 6, "label": "text", "bbox": {"l": 50.112, "t": 159.89300000000003, "r": 286.365, "b": 240.17700000000002, "coord_origin": "TOPLEFT"}, "confidence": 0.9860327839851379, "cells": [{"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 168.44500000000005, "r_x1": 108.154, "r_y1": 168.44500000000005, "r_x2": 108.154, "r_y2": 159.89300000000003, "r_x3": 62.067, "r_y3": 159.89300000000003, "coord_origin": "TOPLEFT"}, "text": "The output", "orig": "The output", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 113.275, "r_y0": 168.44500000000005, "r_x1": 144.806, "r_y1": 168.44500000000005, "r_x2": 144.806, "r_y2": 159.89300000000003, "r_x3": 113.275, "r_y3": 159.89300000000003, "coord_origin": "TOPLEFT"}, "text": "features", "orig": "features", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 149.937, "r_y0": 168.44500000000005, "r_x1": 161.554, "r_y1": 168.44500000000005, "r_x2": 161.554, "r_y2": 159.89300000000003, "r_x3": 149.937, "r_y3": 159.89300000000003, "coord_origin": "TOPLEFT"}, "text": "for", "orig": "for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 166.684, "r_y0": 168.44500000000005, "r_x1": 184.936, "r_y1": 168.44500000000005, "r_x2": 184.936, "r_y2": 159.89300000000003, "r_x3": 166.684, "r_y3": 159.89300000000003, "coord_origin": "TOPLEFT"}, "text": "each", "orig": "each", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 190.057, "r_y0": 168.44500000000005, "r_x1": 209.424, "r_y1": 168.44500000000005, "r_x2": 209.424, "r_y2": 159.89300000000003, "r_x3": 190.057, "r_y3": 159.89300000000003, "coord_origin": "TOPLEFT"}, "text": "table", "orig": "table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 214.555, "r_y0": 168.44500000000005, "r_x1": 228.941, "r_y1": 168.44500000000005, "r_x2": 228.941, "r_y2": 159.89300000000003, "r_x3": 214.555, "r_y3": 159.89300000000003, "coord_origin": "TOPLEFT"}, "text": "cell", "orig": "cell", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 234.061, "r_y0": 168.44500000000005, "r_x1": 246.226, "r_y1": 168.44500000000005, "r_x2": 246.226, "r_y2": 159.89300000000003, "r_x3": 234.061, "r_y3": 159.89300000000003, "coord_origin": "TOPLEFT"}, "text": "are", "orig": "are", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 251.356, "r_y0": 168.44500000000005, "r_x1": 268.512, "r_y1": 168.44500000000005, "r_x2": 268.512, "r_y2": 159.89300000000003, "r_x3": 251.356, "r_y3": 159.89300000000003, "coord_origin": "TOPLEFT"}, "text": "then", "orig": "then", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 273.643, "r_y0": 168.44500000000005, "r_x1": 286.365, "r_y1": 168.44500000000005, "r_x2": 286.365, "r_y2": 159.89300000000003, "r_x3": 273.643, "r_y3": 159.89300000000003, "coord_origin": "TOPLEFT"}, "text": "fed", "orig": "fed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 180.40099999999995, "r_x1": 65.614, "r_y1": 180.40099999999995, "r_x2": 65.614, "r_y2": 171.84900000000005, "r_x3": 50.112, "r_y3": 171.84900000000005, "coord_origin": "TOPLEFT"}, "text": "into", "orig": "into", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.107, "r_y0": 180.40099999999995, "r_x1": 82.281, "r_y1": 180.40099999999995, "r_x2": 82.281, "r_y2": 171.84900000000005, "r_x3": 70.107, "r_y3": 171.84900000000005, "coord_origin": "TOPLEFT"}, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 19, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 86.764, "r_y0": 180.40099999999995, "r_x1": 138.66, "r_y1": 180.40099999999995, "r_x2": 138.66, "r_y2": 171.84900000000005, "r_x3": 86.764, "r_y3": 171.84900000000005, "coord_origin": "TOPLEFT"}, "text": "feed-forward", "orig": "feed-forward", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 20, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 143.153, "r_y0": 180.40099999999995, "r_x1": 286.365, "r_y1": 180.40099999999995, "r_x2": 286.365, "r_y2": 171.84900000000005, "r_x3": 143.153, "r_y3": 171.84900000000005, "coord_origin": "TOPLEFT"}, "text": "network (FFN). The FFN consists", "orig": "network (FFN). The FFN consists", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 21, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 192.356, "r_x1": 286.365, "r_y1": 192.356, "r_x2": 286.365, "r_y2": 183.80399999999997, "r_x3": 50.112, "r_y3": 183.80399999999997, "coord_origin": "TOPLEFT"}, "text": "of a Multi-Layer Perceptron (3 layers with ReLU activa-", "orig": "of a Multi-Layer Perceptron (3 layers with ReLU activa-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 22, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 204.31100000000004, "r_x1": 286.365, "r_y1": 204.31100000000004, "r_x2": 286.365, "r_y2": 195.75900000000001, "r_x3": 50.112, "r_y3": 195.75900000000001, "coord_origin": "TOPLEFT"}, "text": "tion function) that predicts the normalized coordinates for", "orig": "tion function) that predicts the normalized coordinates for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 23, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 216.26599999999996, "r_x1": 196.004, "r_y1": 216.26599999999996, "r_x2": 196.004, "r_y2": 207.71400000000006, "r_x3": 50.112, "r_y3": 207.71400000000006, "coord_origin": "TOPLEFT"}, "text": "the bounding box of each table cell.", "orig": "the bounding box of each table cell.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 24, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 200.786, "r_y0": 216.26599999999996, "r_x1": 286.365, "r_y1": 216.26599999999996, "r_x2": 286.365, "r_y2": 207.71400000000006, "r_x3": 200.786, "r_y3": 207.71400000000006, "coord_origin": "TOPLEFT"}, "text": "Finally, the predicted", "orig": "Finally, the predicted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 25, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 228.221, "r_x1": 286.365, "r_y1": 228.221, "r_x2": 286.365, "r_y2": 219.66899999999998, "r_x3": 50.112, "r_y3": 219.66899999999998, "coord_origin": "TOPLEFT"}, "text": "bounding boxes are classified based on whether they are", "orig": "bounding boxes are classified based on whether they are", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 26, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 240.17700000000002, "r_x1": 181.549, "r_y1": 240.17700000000002, "r_x2": 181.549, "r_y2": 231.625, "r_x3": 50.112, "r_y3": 231.625, "coord_origin": "TOPLEFT"}, "text": "empty or not using a linear layer.", "orig": "empty or not using a linear layer.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 4, "label": "text", "bbox": {"l": 50.112, "t": 243.92200000000003, "r": 286.366, "b": 444.145, "coord_origin": "TOPLEFT"}, "confidence": 0.9873637557029724, "cells": [{"index": 27, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 252.87800000000004, "r_x1": 129.215, "r_y1": 252.87800000000004, "r_x2": 129.215, "r_y2": 243.92200000000003, "r_x3": 62.067, "r_y3": 243.92200000000003, "coord_origin": "TOPLEFT"}, "text": "Loss Functions.", "orig": "Loss Functions.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 28, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.451, "r_y0": 252.86199999999997, "r_x1": 276.139, "r_y1": 252.86199999999997, "r_x2": 276.139, "r_y2": 244.30999999999995, "r_x3": 134.451, "r_y3": 244.30999999999995, "coord_origin": "TOPLEFT"}, "text": "We formulate a multi-task loss Eq.", "orig": "We formulate a multi-task loss Eq.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 29, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 281.379, "r_y0": 252.86199999999997, "r_x1": 286.361, "r_y1": 252.86199999999997, "r_x2": 286.361, "r_y2": 244.30999999999995, "r_x3": 281.379, "r_y3": 244.30999999999995, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 30, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 264.817, "r_x1": 134.685, "r_y1": 264.817, "r_x2": 134.685, "r_y2": 256.265, "r_x3": 50.112, "r_y3": 256.265, "coord_origin": "TOPLEFT"}, "text": "to train our network.", "orig": "to train our network.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 140.543, "r_y0": 264.817, "r_x1": 286.365, "r_y1": 264.817, "r_x2": 286.365, "r_y2": 256.265, "r_x3": 140.543, "r_y3": 256.265, "coord_origin": "TOPLEFT"}, "text": "The Cross-Entropy loss (denoted as", "orig": "The Cross-Entropy loss (denoted as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 276.60900000000004, "r_x1": 53.085, "r_y1": 276.60900000000004, "r_x2": 53.085, "r_y2": 267.903, "r_x3": 50.112, "r_y3": 267.903, "coord_origin": "TOPLEFT"}, "text": "l", "orig": "l", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 53.085, "r_y0": 277.53200000000004, "r_x1": 56.845, "r_y1": 277.53200000000004, "r_x2": 56.845, "r_y2": 271.438, "r_x3": 53.085, "r_y3": 271.438, "coord_origin": "TOPLEFT"}, "text": "s", "orig": "s", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 57.343, "r_y0": 276.773, "r_x1": 135.4, "r_y1": 276.773, "r_x2": 135.4, "r_y2": 268.221, "r_x3": 57.343, "r_y3": 268.221, "coord_origin": "TOPLEFT"}, "text": ") is used to train the", "orig": ") is used to train the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 137.735, "r_y0": 276.63, "r_x1": 211.08, "r_y1": 276.63, "r_x2": 211.08, "r_y2": 268.04200000000003, "r_x3": 137.735, "r_y3": 268.04200000000003, "coord_origin": "TOPLEFT"}, "text": "Structure Decoder", "orig": "Structure Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 213.637, "r_y0": 276.773, "r_x1": 286.364, "r_y1": 276.773, "r_x2": 286.364, "r_y2": 268.221, "r_x3": 213.637, "r_y3": 268.221, "coord_origin": "TOPLEFT"}, "text": "which predicts the", "orig": "which predicts the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 288.728, "r_x1": 158.824, "r_y1": 288.728, "r_x2": 158.824, "r_y2": 280.176, "r_x3": 50.112, "r_y3": 280.176, "coord_origin": "TOPLEFT"}, "text": "structure tokens. As for the", "orig": "structure tokens. As for the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 161.318, "r_y0": 288.585, "r_x1": 238.797, "r_y1": 288.585, "r_x2": 238.797, "r_y2": 279.99699999999996, "r_x3": 161.318, "r_y3": 279.99699999999996, "coord_origin": "TOPLEFT"}, "text": "Cell BBox Decoder", "orig": "Cell BBox Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 241.521, "r_y0": 288.728, "r_x1": 286.363, "r_y1": 288.728, "r_x2": 286.363, "r_y2": 280.176, "r_x3": 241.521, "r_y3": 280.176, "coord_origin": "TOPLEFT"}, "text": "it is trained", "orig": "it is trained", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 300.683, "r_x1": 211.377, "r_y1": 300.683, "r_x2": 211.377, "r_y2": 292.131, "r_x3": 50.112, "r_y3": 292.131, "coord_origin": "TOPLEFT"}, "text": "with a combination of losses denoted as", "orig": "with a combination of losses denoted as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 214.271, "r_y0": 300.519, "r_x1": 217.244, "r_y1": 300.519, "r_x2": 217.244, "r_y2": 291.813, "r_x3": 214.271, "r_y3": 291.813, "coord_origin": "TOPLEFT"}, "text": "l", "orig": "l", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 217.244, "r_y0": 301.442, "r_x1": 229.198, "r_y1": 301.442, "r_x2": 229.198, "r_y2": 295.348, "r_x3": 217.244, "r_y3": 295.348, "coord_origin": "TOPLEFT"}, "text": "box", "orig": "box", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 229.696, "r_y0": 300.683, "r_x1": 232.187, "r_y1": 300.683, "r_x2": 232.187, "r_y2": 292.131, "r_x3": 229.696, "r_y3": 292.131, "coord_origin": "TOPLEFT"}, "text": ".", "orig": ".", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 236.49, "r_y0": 300.519, "r_x1": 239.463, "r_y1": 300.519, "r_x2": 239.463, "r_y2": 291.813, "r_x3": 236.49, "r_y3": 291.813, "coord_origin": "TOPLEFT"}, "text": "l", "orig": "l", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 239.463, "r_y0": 301.442, "r_x1": 251.417, "r_y1": 301.442, "r_x2": 251.417, "r_y2": 295.348, "r_x3": 239.463, "r_y3": 295.348, "coord_origin": "TOPLEFT"}, "text": "box", "orig": "box", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 254.811, "r_y0": 300.683, "r_x1": 286.363, "r_y1": 300.683, "r_x2": 286.363, "r_y2": 292.131, "r_x3": 254.811, "r_y3": 292.131, "coord_origin": "TOPLEFT"}, "text": "consists", "orig": "consists", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 312.638, "r_x1": 137.454, "r_y1": 312.638, "r_x2": 137.454, "r_y2": 304.086, "r_x3": 50.112, "r_y3": 304.086, "coord_origin": "TOPLEFT"}, "text": "of the generally used", "orig": "of the generally used", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 48, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 141.298, "r_y0": 312.474, "r_x1": 144.271, "r_y1": 312.474, "r_x2": 144.271, "r_y2": 303.768, "r_x3": 141.298, "r_y3": 303.768, "coord_origin": "TOPLEFT"}, "text": "l", "orig": "l", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 49, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 144.271, "r_y0": 313.398, "r_x1": 148.243, "r_y1": 313.398, "r_x2": 148.243, "r_y2": 307.304, "r_x3": 144.271, "r_y3": 307.304, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 50, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 152.586, "r_y0": 312.638, "r_x1": 286.364, "r_y1": 312.638, "r_x2": 286.364, "r_y2": 304.086, "r_x3": 152.586, "r_y3": 304.086, "coord_origin": "TOPLEFT"}, "text": "loss for object detection and the", "orig": "loss for object detection and the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 51, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 324.593, "r_x1": 89.683, "r_y1": 324.593, "r_x2": 89.683, "r_y2": 316.041, "r_x3": 50.112, "r_y3": 316.041, "coord_origin": "TOPLEFT"}, "text": "IoU loss (", "orig": "IoU loss (", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 52, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 89.686, "r_y0": 324.429, "r_x1": 92.659, "r_y1": 324.429, "r_x2": 92.659, "r_y2": 315.723, "r_x3": 89.686, "r_y3": 315.723, "coord_origin": "TOPLEFT"}, "text": "l", "orig": "l", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 53, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 92.659, "r_y0": 325.353, "r_x1": 104.12, "r_y1": 325.353, "r_x2": 104.12, "r_y2": 319.259, "r_x3": 92.659, "r_y3": 319.259, "coord_origin": "TOPLEFT"}, "text": "iou", "orig": "iou", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 54, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 104.618, "r_y0": 324.593, "r_x1": 286.366, "r_y1": 324.593, "r_x2": 286.366, "r_y2": 316.041, "r_x3": 104.618, "r_y3": 316.041, "coord_origin": "TOPLEFT"}, "text": ") to be scale invariant as explained in [25]. In", "orig": ") to be scale invariant as explained in [25]. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 55, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 336.549, "r_x1": 286.365, "r_y1": 336.549, "r_x2": 286.365, "r_y2": 327.997, "r_x3": 50.112, "r_y3": 327.997, "coord_origin": "TOPLEFT"}, "text": "comparison to DETR, we do not use the Hungarian algo-", "orig": "comparison to DETR, we do not use the Hungarian algo-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 56, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 348.504, "r_x1": 286.365, "r_y1": 348.504, "r_x2": 286.365, "r_y2": 339.952, "r_x3": 50.112, "r_y3": 339.952, "coord_origin": "TOPLEFT"}, "text": "rithm [15] to match the predicted bounding boxes with the", "orig": "rithm [15] to match the predicted bounding boxes with the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 57, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 360.459, "r_x1": 286.365, "r_y1": 360.459, "r_x2": 286.365, "r_y2": 351.907, "r_x3": 50.112, "r_y3": 351.907, "coord_origin": "TOPLEFT"}, "text": "ground-truth boxes, as we have already achieved a one-to-", "orig": "ground-truth boxes, as we have already achieved a one-to-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 58, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 372.414, "r_x1": 286.365, "r_y1": 372.414, "r_x2": 286.365, "r_y2": 363.862, "r_x3": 50.112, "r_y3": 363.862, "coord_origin": "TOPLEFT"}, "text": "one match through two steps: 1) Our token input sequence", "orig": "one match through two steps: 1) Our token input sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 59, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 384.369, "r_x1": 286.365, "r_y1": 384.369, "r_x2": 286.365, "r_y2": 375.817, "r_x3": 50.112, "r_y3": 375.817, "coord_origin": "TOPLEFT"}, "text": "is naturally ordered, therefore the hidden states of the table", "orig": "is naturally ordered, therefore the hidden states of the table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 60, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 396.324, "r_x1": 286.365, "r_y1": 396.324, "r_x2": 286.365, "r_y2": 387.772, "r_x3": 50.112, "r_y3": 387.772, "coord_origin": "TOPLEFT"}, "text": "data cells are also in order when they are provided as in-", "orig": "data cells are also in order when they are provided as in-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 61, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 408.28, "r_x1": 88.687, "r_y1": 408.28, "r_x2": 88.687, "r_y2": 399.728, "r_x3": 50.112, "r_y3": 399.728, "coord_origin": "TOPLEFT"}, "text": "put to the", "orig": "put to the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 62, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 91.646, "r_y0": 408.137, "r_x1": 170.052, "r_y1": 408.137, "r_x2": 170.052, "r_y2": 399.549, "r_x3": 91.646, "r_y3": 399.549, "coord_origin": "TOPLEFT"}, "text": "Cell BBox Decoder", "orig": "Cell BBox Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 63, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 170.051, "r_y0": 408.28, "r_x1": 172.542, "r_y1": 408.28, "r_x2": 172.542, "r_y2": 399.728, "r_x3": 170.051, "r_y3": 399.728, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 64, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 175.62, "r_y0": 408.28, "r_x1": 286.364, "r_y1": 408.28, "r_x2": 286.364, "r_y2": 399.728, "r_x3": 175.62, "r_y3": 399.728, "coord_origin": "TOPLEFT"}, "text": "and 2) Our bounding boxes", "orig": "and 2) Our bounding boxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 65, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 420.235, "r_x1": 181.967, "r_y1": 420.235, "r_x2": 181.967, "r_y2": 411.683, "r_x3": 50.112, "r_y3": 411.683, "coord_origin": "TOPLEFT"}, "text": "generation mechanism (see Sec.", "orig": "generation mechanism (see Sec.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 66, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 189.09, "r_y0": 420.235, "r_x1": 286.365, "r_y1": 420.235, "r_x2": 286.365, "r_y2": 411.683, "r_x3": 189.09, "r_y3": 411.683, "coord_origin": "TOPLEFT"}, "text": "3) ensures a one-to-one", "orig": "3) ensures a one-to-one", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 67, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 432.19, "r_x1": 286.365, "r_y1": 432.19, "r_x2": 286.365, "r_y2": 423.638, "r_x3": 50.112, "r_y3": 423.638, "coord_origin": "TOPLEFT"}, "text": "mapping between the cell content and its bounding box for", "orig": "mapping between the cell content and its bounding box for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 68, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 444.145, "r_x1": 158.296, "r_y1": 444.145, "r_x2": 158.296, "r_y2": 435.593, "r_x3": 50.112, "r_y3": 435.593, "coord_origin": "TOPLEFT"}, "text": "all post-processed datasets.", "orig": "all post-processed datasets.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 11, "label": "text", "bbox": {"l": 50.112, "t": 448.279, "r": 286.365, "b": 468.786, "coord_origin": "TOPLEFT"}, "confidence": 0.9724196195602417, "cells": [{"index": 69, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 456.831, "r_x1": 286.365, "r_y1": 456.831, "r_x2": 286.365, "r_y2": 448.279, "r_x3": 62.067, "r_y3": 448.279, "coord_origin": "TOPLEFT"}, "text": "The loss used to train the TableFormer can be defined as", "orig": "The loss used to train the TableFormer can be defined as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 70, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 468.786, "r_x1": 91.377, "r_y1": 468.786, "r_x2": 91.377, "r_y2": 460.234, "r_x3": 50.112, "r_y3": 460.234, "coord_origin": "TOPLEFT"}, "text": "following:", "orig": "following:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 15, "label": "formula", "bbox": {"l": 124.33, "t": 493.391, "r": 286.362, "b": 517.9639999999999, "coord_origin": "TOPLEFT"}, "confidence": 0.9423348307609558, "cells": [{"index": 71, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 125.715, "r_y0": 502.097, "r_x1": 128.688, "r_y1": 502.097, "r_x2": 128.688, "r_y2": 493.391, "r_x3": 125.715, "r_y3": 493.391, "coord_origin": "TOPLEFT"}, "text": "l", "orig": "l", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 72, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 128.688, "r_y0": 503.02, "r_x1": 140.642, "r_y1": 503.02, "r_x2": 140.642, "r_y2": 496.926, "r_x3": 128.688, "r_y3": 496.926, "coord_origin": "TOPLEFT"}, "text": "box", "orig": "box", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 73, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 143.907, "r_y0": 502.097, "r_x1": 151.656, "r_y1": 502.097, "r_x2": 151.656, "r_y2": 493.391, "r_x3": 143.907, "r_y3": 493.391, "coord_origin": "TOPLEFT"}, "text": "=", "orig": "=", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 74, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 154.423, "r_y0": 502.097, "r_x1": 160.234, "r_y1": 502.097, "r_x2": 160.234, "r_y2": 493.391, "r_x3": 154.423, "r_y3": 493.391, "coord_origin": "TOPLEFT"}, "text": "\u03bb", "orig": "\u03bb", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 75, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.235, "r_y0": 503.02, "r_x1": 186.628, "r_y1": 503.02, "r_x2": 186.628, "r_y2": 496.926, "r_x3": 160.235, "r_y3": 496.926, "coord_origin": "TOPLEFT"}, "text": "iou iou", "orig": "iou iou", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 76, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 172.194, "r_y0": 502.097, "r_x1": 175.167, "r_y1": 502.097, "r_x2": 175.167, "r_y2": 493.391, "r_x3": 172.194, "r_y3": 493.391, "coord_origin": "TOPLEFT"}, "text": "l", "orig": "l", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 77, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 189.34, "r_y0": 502.097, "r_x1": 197.089, "r_y1": 502.097, "r_x2": 197.089, "r_y2": 493.391, "r_x3": 189.34, "r_y3": 493.391, "coord_origin": "TOPLEFT"}, "text": "+", "orig": "+", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 78, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 199.303, "r_y0": 502.097, "r_x1": 205.114, "r_y1": 502.097, "r_x2": 205.114, "r_y2": 493.391, "r_x3": 199.303, "r_y3": 493.391, "coord_origin": "TOPLEFT"}, "text": "\u03bb", "orig": "\u03bb", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 79, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 205.115, "r_y0": 503.02, "r_x1": 207.635, "r_y1": 503.02, "r_x2": 207.635, "r_y2": 496.926, "r_x3": 205.115, "r_y3": 496.926, "coord_origin": "TOPLEFT"}, "text": "l", "orig": "l", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 80, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 207.675, "r_y0": 503.02, "r_x1": 211.647, "r_y1": 503.02, "r_x2": 211.647, "r_y2": 496.926, "r_x3": 207.675, "r_y3": 496.926, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 81, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 124.33, "r_y0": 517.0409999999999, "r_x1": 127.303, "r_y1": 517.0409999999999, "r_x2": 127.303, "r_y2": 508.335, "r_x3": 124.33, "r_y3": 508.335, "coord_origin": "TOPLEFT"}, "text": "l", "orig": "l", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 82, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 130.266, "r_y0": 517.0409999999999, "r_x1": 138.015, "r_y1": 517.0409999999999, "r_x2": 138.015, "r_y2": 508.335, "r_x3": 130.266, "r_y3": 508.335, "coord_origin": "TOPLEFT"}, "text": "=", "orig": "=", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 83, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 140.782, "r_y0": 517.0409999999999, "r_x1": 149.566, "r_y1": 517.0409999999999, "r_x2": 149.566, "r_y2": 508.335, "r_x3": 140.782, "r_y3": 508.335, "coord_origin": "TOPLEFT"}, "text": "\u03bbl", "orig": "\u03bbl", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 84, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 149.566, "r_y0": 517.9639999999999, "r_x1": 153.326, "r_y1": 517.9639999999999, "r_x2": 153.326, "r_y2": 511.87, "r_x3": 149.566, "r_y3": 511.87, "coord_origin": "TOPLEFT"}, "text": "s", "orig": "s", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 85, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 156.039, "r_y0": 517.0409999999999, "r_x1": 174.855, "r_y1": 517.0409999999999, "r_x2": 174.855, "r_y2": 508.335, "r_x3": 156.039, "r_y3": 508.335, "coord_origin": "TOPLEFT"}, "text": "+(1", "orig": "+(1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 86, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 177.071, "r_y0": 516.899, "r_x1": 184.82, "r_y1": 516.899, "r_x2": 184.82, "r_y2": 508.335, "r_x3": 177.071, "r_y3": 508.335, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 87, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 187.033, "r_y0": 517.0409999999999, "r_x1": 199.692, "r_y1": 517.0409999999999, "r_x2": 199.692, "r_y2": 508.335, "r_x3": 187.033, "r_y3": 508.335, "coord_origin": "TOPLEFT"}, "text": "\u03bb l", "orig": "\u03bb l", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 88, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 192.845, "r_y0": 517.0409999999999, "r_x1": 196.719, "r_y1": 517.0409999999999, "r_x2": 196.719, "r_y2": 508.335, "r_x3": 192.845, "r_y3": 508.335, "coord_origin": "TOPLEFT"}, "text": ")", "orig": ")", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 89, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 199.692, "r_y0": 517.9639999999999, "r_x1": 211.646, "r_y1": 517.9639999999999, "r_x2": 211.646, "r_y2": 511.87, "r_x3": 199.692, "r_y3": 511.87, "coord_origin": "TOPLEFT"}, "text": "box", "orig": "box", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 90, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 274.746, "r_y0": 509.832, "r_x1": 286.362, "r_y1": 509.832, "r_x2": 286.362, "r_y2": 501.28, "r_x3": 274.746, "r_y3": 501.28, "coord_origin": "TOPLEFT"}, "text": "(1)", "orig": "(1)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 16, "label": "text", "bbox": {"l": 50.112, "t": 531.26, "r": 281.597, "b": 540.889, "coord_origin": "TOPLEFT"}, "confidence": 0.9363929629325867, "cells": [{"index": 91, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 540.13, "r_x1": 74.451, "r_y1": 540.13, "r_x2": 74.451, "r_y2": 531.578, "r_x3": 50.112, "r_y3": 531.578, "coord_origin": "TOPLEFT"}, "text": "where", "orig": "where", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 92, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 76.941, "r_y0": 539.966, "r_x1": 82.752, "r_y1": 539.966, "r_x2": 82.752, "r_y2": 531.26, "r_x3": 76.941, "r_y3": 531.26, "coord_origin": "TOPLEFT"}, "text": "\u03bb", "orig": "\u03bb", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 93, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 85.52, "r_y0": 539.8240000000001, "r_x1": 92.162, "r_y1": 539.8240000000001, "r_x2": 92.162, "r_y2": 531.26, "r_x3": 85.52, "r_y3": 531.26, "coord_origin": "TOPLEFT"}, "text": "\u2208", "orig": "\u2208", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 94, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 94.653, "r_y0": 540.13, "r_x1": 135.599, "r_y1": 540.13, "r_x2": 135.599, "r_y2": 531.578, "r_x3": 94.653, "r_y3": 531.578, "coord_origin": "TOPLEFT"}, "text": "[0, 1], and", "orig": "[0, 1], and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 95, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 138.09, "r_y0": 539.966, "r_x1": 143.901, "r_y1": 539.966, "r_x2": 143.901, "r_y2": 531.26, "r_x3": 138.09, "r_y3": 531.26, "coord_origin": "TOPLEFT"}, "text": "\u03bb", "orig": "\u03bb", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 96, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 143.901, "r_y0": 540.889, "r_x1": 155.362, "r_y1": 540.889, "r_x2": 155.362, "r_y2": 534.7950000000001, "r_x3": 143.901, "r_y3": 534.7950000000001, "coord_origin": "TOPLEFT"}, "text": "iou", "orig": "iou", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 97, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 155.861, "r_y0": 539.966, "r_x1": 166.104, "r_y1": 539.966, "r_x2": 166.104, "r_y2": 531.26, "r_x3": 155.861, "r_y3": 531.26, "coord_origin": "TOPLEFT"}, "text": ", \u03bb", "orig": ", \u03bb", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 98, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 166.1, "r_y0": 540.889, "r_x1": 168.62, "r_y1": 540.889, "r_x2": 168.62, "r_y2": 534.7950000000001, "r_x3": 166.1, "r_y3": 534.7950000000001, "coord_origin": "TOPLEFT"}, "text": "l", "orig": "l", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 99, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 168.66, "r_y0": 540.889, "r_x1": 172.632, "r_y1": 540.889, "r_x2": 172.632, "r_y2": 534.7950000000001, "r_x3": 168.66, "r_y3": 534.7950000000001, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 100, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 175.897, "r_y0": 539.8240000000001, "r_x1": 182.539, "r_y1": 539.8240000000001, "r_x2": 182.539, "r_y2": 531.26, "r_x3": 175.897, "r_y3": 531.26, "coord_origin": "TOPLEFT"}, "text": "\u2208", "orig": "\u2208", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 101, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 185.306, "r_y0": 538.064, "r_x1": 192.501, "r_y1": 538.064, "r_x2": 192.501, "r_y2": 533.441, "r_x3": 185.306, "r_y3": 533.441, "coord_origin": "TOPLEFT"}, "text": "R", "orig": "R", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 102, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 194.992, "r_y0": 540.13, "r_x1": 281.597, "r_y1": 540.13, "r_x2": 281.597, "r_y2": 531.578, "r_x3": 194.992, "r_y3": 531.578, "coord_origin": "TOPLEFT"}, "text": "are hyper-parameters.", "orig": "are hyper-parameters.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 12, "label": "section_header", "bbox": {"l": 50.112, "t": 555.917, "r": 171.983, "b": 566.665, "coord_origin": "TOPLEFT"}, "confidence": 0.9554555416107178, "cells": [{"index": 103, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 566.665, "r_x1": 171.983, "r_y1": 566.665, "r_x2": 171.983, "r_y2": 555.917, "r_x3": 50.112, "r_y3": 555.917, "coord_origin": "TOPLEFT"}, "text": "5. Experimental Results", "orig": "5. Experimental Results", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 13, "label": "section_header", "bbox": {"l": 50.112, "t": 576.264, "r": 179.175, "b": 586.116, "coord_origin": "TOPLEFT"}, "confidence": 0.9538503289222717, "cells": [{"index": 104, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 586.116, "r_x1": 179.175, "r_y1": 586.116, "r_x2": 179.175, "r_y2": 576.264, "r_x3": 50.112, "r_y3": 576.264, "coord_origin": "TOPLEFT"}, "text": "5.1. Implementation Details", "orig": "5.1. Implementation Details", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 7, "label": "text", "bbox": {"l": 50.112, "t": 595.8240000000001, "r": 286.365, "b": 640.421, "coord_origin": "TOPLEFT"}, "confidence": 0.9856163263320923, "cells": [{"index": 105, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 604.5550000000001, "r_x1": 202.978, "r_y1": 604.5550000000001, "r_x2": 202.978, "r_y2": 596.0029999999999, "r_x3": 62.067, "r_y3": 596.0029999999999, "coord_origin": "TOPLEFT"}, "text": "TableFormer uses ResNet-18 as the", "orig": "TableFormer uses ResNet-18 as the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 106, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 205.384, "r_y0": 604.412, "r_x1": 286.36, "r_y1": 604.412, "r_x2": 286.36, "r_y2": 595.8240000000001, "r_x3": 205.384, "r_y3": 595.8240000000001, "coord_origin": "TOPLEFT"}, "text": "CNN Backbone Net-", "orig": "CNN Backbone Net-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 107, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 616.367, "r_x1": 70.037, "r_y1": 616.367, "r_x2": 70.037, "r_y2": 607.779, "r_x3": 50.112, "r_y3": 607.779, "coord_origin": "TOPLEFT"}, "text": "work", "orig": "work", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 108, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.037, "r_y0": 616.51, "r_x1": 72.528, "r_y1": 616.51, "r_x2": 72.528, "r_y2": 607.958, "r_x3": 70.037, "r_y3": 607.958, "coord_origin": "TOPLEFT"}, "text": ".", "orig": ".", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 109, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 77.14, "r_y0": 616.51, "r_x1": 286.365, "r_y1": 616.51, "r_x2": 286.365, "r_y2": 607.958, "r_x3": 77.14, "r_y3": 607.958, "coord_origin": "TOPLEFT"}, "text": "The input images are resized to 448*448 pixels and", "orig": "The input images are resized to 448*448 pixels and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 110, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 628.465, "r_x1": 286.365, "r_y1": 628.465, "r_x2": 286.365, "r_y2": 619.913, "r_x3": 50.112, "r_y3": 619.913, "coord_origin": "TOPLEFT"}, "text": "the feature map has a dimension of 28*28. Additionally, we", "orig": "the feature map has a dimension of 28*28. Additionally, we", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 111, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 640.421, "r_x1": 207.033, "r_y1": 640.421, "r_x2": 207.033, "r_y2": 631.869, "r_x3": 50.112, "r_y3": 631.869, "coord_origin": "TOPLEFT"}, "text": "enforce the following input constraints:", "orig": "enforce the following input constraints:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 18, "label": "formula", "bbox": {"l": 91.661, "t": 654.496, "r": 286.362, "b": 678.31, "coord_origin": "TOPLEFT"}, "confidence": 0.844183623790741, "cells": [{"index": 112, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 91.661, "r_y0": 663.366, "r_x1": 186.017, "r_y1": 663.366, "r_x2": 186.017, "r_y2": 654.814, "r_x3": 91.661, "r_y3": 654.814, "coord_origin": "TOPLEFT"}, "text": "Image width and height", "orig": "Image width and height", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 113, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 188.507, "r_y0": 663.06, "r_x1": 196.256, "r_y1": 663.06, "r_x2": 196.256, "r_y2": 654.496, "r_x3": 188.507, "r_y3": 654.496, "coord_origin": "TOPLEFT"}, "text": "\u2264", "orig": "\u2264", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 114, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 198.746, "r_y0": 663.366, "r_x1": 244.813, "r_y1": 663.366, "r_x2": 244.813, "r_y2": 654.814, "r_x3": 198.746, "r_y3": 654.814, "coord_origin": "TOPLEFT"}, "text": "1024 pixels", "orig": "1024 pixels", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 115, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 101.016, "r_y0": 678.31, "r_x1": 186.246, "r_y1": 678.31, "r_x2": 186.246, "r_y2": 669.758, "r_x3": 101.016, "r_y3": 669.758, "coord_origin": "TOPLEFT"}, "text": "Structural tags length", "orig": "Structural tags length", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 116, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 188.736, "r_y0": 678.004, "r_x1": 196.485, "r_y1": 678.004, "r_x2": 196.485, "r_y2": 669.44, "r_x3": 188.736, "r_y3": 669.44, "coord_origin": "TOPLEFT"}, "text": "\u2264", "orig": "\u2264", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 117, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 198.975, "r_y0": 678.31, "r_x1": 244.813, "r_y1": 678.31, "r_x2": 244.813, "r_y2": 669.758, "r_x3": 198.975, "r_y3": 669.758, "coord_origin": "TOPLEFT"}, "text": "512 tokens.", "orig": "512 tokens.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 118, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 274.746, "r_y0": 670.938, "r_x1": 286.362, "r_y1": 670.938, "r_x2": 286.362, "r_y2": 662.386, "r_x3": 274.746, "r_y3": 662.386, "coord_origin": "TOPLEFT"}, "text": "(2)", "orig": "(2)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 10, "label": "text", "bbox": {"l": 50.112, "t": 692.559, "r": 286.365, "b": 713.066, "coord_origin": "TOPLEFT"}, "confidence": 0.9724979996681213, "cells": [{"index": 119, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 701.111, "r_x1": 286.365, "r_y1": 701.111, "r_x2": 286.365, "r_y2": 692.559, "r_x3": 50.112, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "Although input constraints are used also by other methods,", "orig": "Although input constraints are used also by other methods,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 120, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 713.066, "r_x1": 286.365, "r_y1": 713.066, "r_x2": 286.365, "r_y2": 704.514, "r_x3": 50.112, "r_y3": 704.514, "coord_origin": "TOPLEFT"}, "text": "such as EDD, ours are less restrictive due to the improved", "orig": "such as EDD, ours are less restrictive due to the improved", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 9, "label": "text", "bbox": {"l": 308.862, "t": 75.47699999999998, "r": 545.115, "b": 107.93899999999996, "coord_origin": "TOPLEFT"}, "confidence": 0.9799237847328186, "cells": [{"index": 121, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 84.029, "r_x1": 545.115, "r_y1": 84.029, "r_x2": 545.115, "r_y2": 75.47699999999998, "r_x3": 308.862, "r_y3": 75.47699999999998, "coord_origin": "TOPLEFT"}, "text": "runtime performance and lower memory footprint of Table-", "orig": "runtime performance and lower memory footprint of Table-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 122, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 95.98400000000004, "r_x1": 339.985, "r_y1": 95.98400000000004, "r_x2": 339.985, "r_y2": 87.43200000000002, "r_x3": 308.862, "r_y3": 87.43200000000002, "coord_origin": "TOPLEFT"}, "text": "Former.", "orig": "Former.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 123, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 346.889, "r_y0": 95.98400000000004, "r_x1": 545.115, "r_y1": 95.98400000000004, "r_x2": 545.115, "r_y2": 87.43200000000002, "r_x3": 346.889, "r_y3": 87.43200000000002, "coord_origin": "TOPLEFT"}, "text": "This allows to utilize input samples with longer", "orig": "This allows to utilize input samples with longer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 124, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 107.93899999999996, "r_x1": 492.961, "r_y1": 107.93899999999996, "r_x2": 492.961, "r_y2": 99.38699999999994, "r_x3": 308.862, "r_y3": 99.38699999999994, "coord_origin": "TOPLEFT"}, "text": "sequences and images with larger dimensions.", "orig": "sequences and images with larger dimensions.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 1, "label": "text", "bbox": {"l": 308.862, "t": 116.49800000000005, "r": 545.115, "b": 328.288, "coord_origin": "TOPLEFT"}, "confidence": 0.9880930781364441, "cells": [{"index": 125, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 125.04999999999995, "r_x1": 545.115, "r_y1": 125.04999999999995, "r_x2": 545.115, "r_y2": 116.49800000000005, "r_x3": 320.817, "r_y3": 116.49800000000005, "coord_origin": "TOPLEFT"}, "text": "The Transformer Encoder consists of two 'Transformer", "orig": "The Transformer Encoder consists of two 'Transformer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 126, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 137.005, "r_x1": 545.115, "r_y1": 137.005, "r_x2": 545.115, "r_y2": 128.45299999999997, "r_x3": 308.862, "r_y3": 128.45299999999997, "coord_origin": "TOPLEFT"}, "text": "Encoder Layers', with an input feature size of 512, feed", "orig": "Encoder Layers', with an input feature size of 512, feed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 127, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 148.96000000000004, "r_x1": 545.115, "r_y1": 148.96000000000004, "r_x2": 545.115, "r_y2": 140.40800000000002, "r_x3": 308.862, "r_y3": 140.40800000000002, "coord_origin": "TOPLEFT"}, "text": "forward network of 1024, and 4 attention heads. As for the", "orig": "forward network of 1024, and 4 attention heads. As for the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 128, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 160.91499999999996, "r_x1": 545.115, "r_y1": 160.91499999999996, "r_x2": 545.115, "r_y2": 152.36300000000006, "r_x3": 308.862, "r_y3": 152.36300000000006, "coord_origin": "TOPLEFT"}, "text": "Transformer Decoder it is composed of four 'Transformer", "orig": "Transformer Decoder it is composed of four 'Transformer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 129, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 172.87, "r_x1": 545.115, "r_y1": 172.87, "r_x2": 545.115, "r_y2": 164.31799999999998, "r_x3": 308.862, "r_y3": 164.31799999999998, "coord_origin": "TOPLEFT"}, "text": "Decoder Layers' with similar input and output dimensions", "orig": "Decoder Layers' with similar input and output dimensions", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 130, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 184.82600000000002, "r_x1": 317.161, "r_y1": 184.82600000000002, "r_x2": 317.161, "r_y2": 176.274, "r_x3": 308.862, "r_y3": 176.274, "coord_origin": "TOPLEFT"}, "text": "as", "orig": "as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 131, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 321.365, "r_y0": 184.82600000000002, "r_x1": 333.539, "r_y1": 184.82600000000002, "r_x2": 333.539, "r_y2": 176.274, "r_x3": 321.365, "r_y3": 176.274, "coord_origin": "TOPLEFT"}, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 132, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 337.734, "r_y0": 184.82600000000002, "r_x1": 467.218, "r_y1": 184.82600000000002, "r_x2": 467.218, "r_y2": 176.274, "r_x3": 337.734, "r_y3": 176.274, "coord_origin": "TOPLEFT"}, "text": "'Transformer Encoder Layers'.", "orig": "'Transformer Encoder Layers'.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 133, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 475.437, "r_y0": 184.82600000000002, "r_x1": 545.115, "r_y1": 184.82600000000002, "r_x2": 545.115, "r_y2": 176.274, "r_x3": 475.437, "r_y3": 176.274, "coord_origin": "TOPLEFT"}, "text": "Even though our", "orig": "Even though our", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 134, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 196.78099999999995, "r_x1": 545.115, "r_y1": 196.78099999999995, "r_x2": 545.115, "r_y2": 188.22900000000004, "r_x3": 308.862, "r_y3": 188.22900000000004, "coord_origin": "TOPLEFT"}, "text": "model uses fewer layers and heads than the default imple-", "orig": "model uses fewer layers and heads than the default imple-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 135, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 208.736, "r_x1": 399.213, "r_y1": 208.736, "r_x2": 399.213, "r_y2": 200.18399999999997, "r_x3": 308.862, "r_y3": 200.18399999999997, "coord_origin": "TOPLEFT"}, "text": "mentation parameters,", "orig": "mentation parameters,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 136, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 403.965, "r_y0": 208.736, "r_x1": 458.63, "r_y1": 208.736, "r_x2": 458.63, "r_y2": 200.18399999999997, "r_x3": 403.965, "r_y3": 200.18399999999997, "coord_origin": "TOPLEFT"}, "text": "our extensive", "orig": "our extensive", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 137, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 462.934, "r_y0": 208.736, "r_x1": 545.115, "r_y1": 208.736, "r_x2": 545.115, "r_y2": 200.18399999999997, "r_x3": 462.934, "r_y3": 200.18399999999997, "coord_origin": "TOPLEFT"}, "text": "experimentation has", "orig": "experimentation has", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 138, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 220.69100000000003, "r_x1": 527.84, "r_y1": 220.69100000000003, "r_x2": 527.84, "r_y2": 212.139, "r_x3": 308.862, "r_y3": 212.139, "coord_origin": "TOPLEFT"}, "text": "proved this setup to be more suitable for table images.", "orig": "proved this setup to be more suitable for table images.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 139, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 532.084, "r_y0": 220.69100000000003, "r_x1": 545.115, "r_y1": 220.69100000000003, "r_x2": 545.115, "r_y2": 212.139, "r_x3": 532.084, "r_y3": 212.139, "coord_origin": "TOPLEFT"}, "text": "We", "orig": "We", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 140, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 232.64599999999996, "r_x1": 341.868, "r_y1": 232.64599999999996, "r_x2": 341.868, "r_y2": 224.09400000000005, "r_x3": 308.862, "r_y3": 224.09400000000005, "coord_origin": "TOPLEFT"}, "text": "attribute", "orig": "attribute", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 141, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 346.371, "r_y0": 232.64599999999996, "r_x1": 360.767, "r_y1": 232.64599999999996, "r_x2": 360.767, "r_y2": 224.09400000000005, "r_x3": 346.371, "r_y3": 224.09400000000005, "coord_origin": "TOPLEFT"}, "text": "this", "orig": "this", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 142, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 365.27, "r_y0": 232.64599999999996, "r_x1": 393.504, "r_y1": 232.64599999999996, "r_x2": 393.504, "r_y2": 224.09400000000005, "r_x3": 365.27, "r_y3": 224.09400000000005, "coord_origin": "TOPLEFT"}, "text": "finding", "orig": "finding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 143, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 398.007, "r_y0": 232.64599999999996, "r_x1": 405.758, "r_y1": 232.64599999999996, "r_x2": 405.758, "r_y2": 224.09400000000005, "r_x3": 398.007, "r_y3": 224.09400000000005, "coord_origin": "TOPLEFT"}, "text": "to", "orig": "to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 144, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 410.261, "r_y0": 232.64599999999996, "r_x1": 422.436, "r_y1": 232.64599999999996, "r_x2": 422.436, "r_y2": 224.09400000000005, "r_x3": 410.261, "r_y3": 224.09400000000005, "coord_origin": "TOPLEFT"}, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 145, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 426.939, "r_y0": 232.64599999999996, "r_x1": 459.586, "r_y1": 232.64599999999996, "r_x2": 459.586, "r_y2": 224.09400000000005, "r_x3": 426.939, "r_y3": 224.09400000000005, "coord_origin": "TOPLEFT"}, "text": "inherent", "orig": "inherent", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 146, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 464.089, "r_y0": 232.64599999999996, "r_x1": 490.102, "r_y1": 232.64599999999996, "r_x2": 490.102, "r_y2": 224.09400000000005, "r_x3": 464.089, "r_y3": 224.09400000000005, "coord_origin": "TOPLEFT"}, "text": "design", "orig": "design", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 147, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 494.605, "r_y0": 232.64599999999996, "r_x1": 502.904, "r_y1": 232.64599999999996, "r_x2": 502.904, "r_y2": 224.09400000000005, "r_x3": 494.605, "r_y3": 224.09400000000005, "coord_origin": "TOPLEFT"}, "text": "of", "orig": "of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 148, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 507.407, "r_y0": 232.64599999999996, "r_x1": 526.774, "r_y1": 232.64599999999996, "r_x2": 526.774, "r_y2": 224.09400000000005, "r_x3": 507.407, "r_y3": 224.09400000000005, "coord_origin": "TOPLEFT"}, "text": "table", "orig": "table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 149, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 531.277, "r_y0": 232.64599999999996, "r_x1": 545.115, "r_y1": 232.64599999999996, "r_x2": 545.115, "r_y2": 224.09400000000005, "r_x3": 531.277, "r_y3": 224.09400000000005, "coord_origin": "TOPLEFT"}, "text": "im-", "orig": "im-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 150, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 244.601, "r_x1": 545.115, "r_y1": 244.601, "r_x2": 545.115, "r_y2": 236.04899999999998, "r_x3": 308.862, "r_y3": 236.04899999999998, "coord_origin": "TOPLEFT"}, "text": "ages, which contain mostly lines and text, unlike the more", "orig": "ages, which contain mostly lines and text, unlike the more", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 151, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 256.557, "r_x1": 496.169, "r_y1": 256.557, "r_x2": 496.169, "r_y2": 248.005, "r_x3": 308.862, "r_y3": 248.005, "coord_origin": "TOPLEFT"}, "text": "elaborate content present in other scopes (e.g.", "orig": "elaborate content present in other scopes (e.g.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 152, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 501.897, "r_y0": 256.557, "r_x1": 545.115, "r_y1": 256.557, "r_x2": 545.115, "r_y2": 248.005, "r_x3": 501.897, "r_y3": 248.005, "coord_origin": "TOPLEFT"}, "text": "the COCO", "orig": "the COCO", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 153, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 268.51199999999994, "r_x1": 342.336, "r_y1": 268.51199999999994, "r_x2": 342.336, "r_y2": 259.96000000000004, "r_x3": 308.862, "r_y3": 259.96000000000004, "coord_origin": "TOPLEFT"}, "text": "dataset).", "orig": "dataset).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 154, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 348.952, "r_y0": 268.51199999999994, "r_x1": 545.115, "r_y1": 268.51199999999994, "r_x2": 545.115, "r_y2": 259.96000000000004, "r_x3": 348.952, "r_y3": 259.96000000000004, "coord_origin": "TOPLEFT"}, "text": "Moreover, we have added ResNet blocks to the", "orig": "Moreover, we have added ResNet blocks to the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 155, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 280.467, "r_x1": 545.115, "r_y1": 280.467, "r_x2": 545.115, "r_y2": 271.91499999999996, "r_x3": 308.862, "r_y3": 271.91499999999996, "coord_origin": "TOPLEFT"}, "text": "inputs of the Structure Decoder and Cell BBox Decoder.", "orig": "inputs of the Structure Decoder and Cell BBox Decoder.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 156, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 292.422, "r_x1": 545.115, "r_y1": 292.422, "r_x2": 545.115, "r_y2": 283.87, "r_x3": 308.862, "r_y3": 283.87, "coord_origin": "TOPLEFT"}, "text": "This prevents a decoder having a stronger influence over the", "orig": "This prevents a decoder having a stronger influence over the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 157, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 304.377, "r_x1": 545.115, "r_y1": 304.377, "r_x2": 545.115, "r_y2": 295.825, "r_x3": 308.862, "r_y3": 295.825, "coord_origin": "TOPLEFT"}, "text": "learned weights which would damage the other prediction", "orig": "learned weights which would damage the other prediction", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 158, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 316.332, "r_x1": 545.115, "r_y1": 316.332, "r_x2": 545.115, "r_y2": 307.78, "r_x3": 308.862, "r_y3": 307.78, "coord_origin": "TOPLEFT"}, "text": "task (structure vs bounding boxes), but learn task specific", "orig": "task (structure vs bounding boxes), but learn task specific", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 159, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 328.288, "r_x1": 532.483, "r_y1": 328.288, "r_x2": 532.483, "r_y2": 319.736, "r_x3": 308.862, "r_y3": 319.736, "coord_origin": "TOPLEFT"}, "text": "weights instead. Lastly our dropout layers are set to 0.5.", "orig": "weights instead. Lastly our dropout layers are set to 0.5.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 3, "label": "text", "bbox": {"l": 308.862, "t": 336.846, "r": 545.115, "b": 429.084, "coord_origin": "TOPLEFT"}, "confidence": 0.9877589344978333, "cells": [{"index": 160, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 345.398, "r_x1": 545.115, "r_y1": 345.398, "r_x2": 545.115, "r_y2": 336.846, "r_x3": 320.817, "r_y3": 336.846, "coord_origin": "TOPLEFT"}, "text": "For training, TableFormer is trained with 3 Adam opti-", "orig": "For training, TableFormer is trained with 3 Adam opti-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 161, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 357.353, "r_x1": 403.736, "r_y1": 357.353, "r_x2": 403.736, "r_y2": 348.801, "r_x3": 308.862, "r_y3": 348.801, "coord_origin": "TOPLEFT"}, "text": "mizers, each one for the", "orig": "mizers, each one for the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 162, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 406.076, "r_y0": 357.21, "r_x1": 545.112, "r_y1": 357.21, "r_x2": 545.112, "r_y2": 348.622, "r_x3": 406.076, "r_y3": 348.622, "coord_origin": "TOPLEFT"}, "text": "CNN Backbone Network Structure", "orig": "CNN Backbone Network Structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 163, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 503.539, "r_y0": 357.353, "r_x1": 506.03, "r_y1": 357.353, "r_x2": 506.03, "r_y2": 348.801, "r_x3": 503.539, "r_y3": 348.801, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 164, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 369.165, "r_x1": 343.163, "r_y1": 369.165, "r_x2": 343.163, "r_y2": 360.577, "r_x3": 308.862, "r_y3": 360.577, "coord_origin": "TOPLEFT"}, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 165, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 343.163, "r_y0": 369.308, "r_x1": 362.202, "r_y1": 369.308, "r_x2": 362.202, "r_y2": 360.756, "r_x3": 343.163, "r_y3": 360.756, "coord_origin": "TOPLEFT"}, "text": ", and", "orig": ", and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 166, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 364.286, "r_y0": 369.165, "r_x1": 440.938, "r_y1": 369.165, "r_x2": 440.938, "r_y2": 360.577, "r_x3": 364.286, "r_y3": 360.577, "coord_origin": "TOPLEFT"}, "text": "Cell BBox Decoder", "orig": "Cell BBox Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 167, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 440.939, "r_y0": 369.308, "r_x1": 443.43, "r_y1": 369.308, "r_x2": 443.43, "r_y2": 360.756, "r_x3": 440.939, "r_y3": 360.756, "coord_origin": "TOPLEFT"}, "text": ".", "orig": ".", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 168, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 446.379, "r_y0": 369.308, "r_x1": 545.108, "r_y1": 369.308, "r_x2": 545.108, "r_y2": 360.756, "r_x3": 446.379, "r_y3": 360.756, "coord_origin": "TOPLEFT"}, "text": "Taking the PubTabNet as", "orig": "Taking the PubTabNet as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 169, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 381.263, "r_x1": 545.115, "r_y1": 381.263, "r_x2": 545.115, "r_y2": 372.711, "r_x3": 308.862, "r_y3": 372.711, "coord_origin": "TOPLEFT"}, "text": "an example for our parameter set up, the initializing learn-", "orig": "an example for our parameter set up, the initializing learn-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 170, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 393.219, "r_x1": 545.115, "r_y1": 393.219, "r_x2": 545.115, "r_y2": 384.667, "r_x3": 308.862, "r_y3": 384.667, "coord_origin": "TOPLEFT"}, "text": "ing rate is 0.001 for 12 epochs with a batch size of 24, and", "orig": "ing rate is 0.001 for 12 epochs with a batch size of 24, and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 171, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 405.01, "r_x1": 314.673, "r_y1": 405.01, "r_x2": 314.673, "r_y2": 396.304, "r_x3": 308.862, "r_y3": 396.304, "coord_origin": "TOPLEFT"}, "text": "\u03bb", "orig": "\u03bb", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 172, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 318.658, "r_y0": 405.174, "r_x1": 329.726, "r_y1": 405.174, "r_x2": 329.726, "r_y2": 396.622, "r_x3": 318.658, "r_y3": 396.622, "coord_origin": "TOPLEFT"}, "text": "set", "orig": "set", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 173, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 333.711, "r_y0": 405.174, "r_x1": 341.462, "r_y1": 405.174, "r_x2": 341.462, "r_y2": 396.622, "r_x3": 333.711, "r_y3": 396.622, "coord_origin": "TOPLEFT"}, "text": "to", "orig": "to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 174, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 345.447, "r_y0": 405.174, "r_x1": 360.391, "r_y1": 405.174, "r_x2": 360.391, "r_y2": 396.622, "r_x3": 345.447, "r_y3": 396.622, "coord_origin": "TOPLEFT"}, "text": "0.5.", "orig": "0.5.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 175, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 367.963, "r_y0": 405.174, "r_x1": 415.166, "r_y1": 405.174, "r_x2": 415.166, "r_y2": 396.622, "r_x3": 367.963, "r_y3": 396.622, "coord_origin": "TOPLEFT"}, "text": "Afterwards,", "orig": "Afterwards,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 176, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 419.519, "r_y0": 405.174, "r_x1": 545.108, "r_y1": 405.174, "r_x2": 545.108, "r_y2": 396.622, "r_x3": 419.519, "r_y3": 396.622, "coord_origin": "TOPLEFT"}, "text": "we reduce the learning rate to", "orig": "we reduce the learning rate to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 177, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 417.129, "r_x1": 545.115, "r_y1": 417.129, "r_x2": 545.115, "r_y2": 408.577, "r_x3": 308.862, "r_y3": 408.577, "coord_origin": "TOPLEFT"}, "text": "0.0001, the batch size to 18 and train for 12 more epochs or", "orig": "0.0001, the batch size to 18 and train for 12 more epochs or", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 178, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 429.084, "r_x1": 360.966, "r_y1": 429.084, "r_x2": 360.966, "r_y2": 420.532, "r_x3": 308.862, "r_y3": 420.532, "coord_origin": "TOPLEFT"}, "text": "convergence.", "orig": "convergence.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 0, "label": "text", "bbox": {"l": 308.862, "t": 437.643, "r": 545.115, "b": 553.7909999999999, "coord_origin": "TOPLEFT"}, "confidence": 0.9884491562843323, "cells": [{"index": 179, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 446.195, "r_x1": 545.115, "r_y1": 446.195, "r_x2": 545.115, "r_y2": 437.643, "r_x3": 320.817, "r_y3": 437.643, "coord_origin": "TOPLEFT"}, "text": "TableFormer is implemented with PyTorch and Torchvi-", "orig": "TableFormer is implemented with PyTorch and Torchvi-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 180, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 458.15, "r_x1": 384.628, "r_y1": 458.15, "r_x2": 384.628, "r_y2": 449.598, "r_x3": 308.862, "r_y3": 449.598, "coord_origin": "TOPLEFT"}, "text": "sion libraries [22].", "orig": "sion libraries [22].", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 181, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 391.372, "r_y0": 458.15, "r_x1": 545.115, "r_y1": 458.15, "r_x2": 545.115, "r_y2": 449.598, "r_x3": 391.372, "r_y3": 449.598, "coord_origin": "TOPLEFT"}, "text": "To speed up the inference, the image", "orig": "To speed up the inference, the image", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 182, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 470.105, "r_x1": 494.007, "r_y1": 470.105, "r_x2": 494.007, "r_y2": 461.553, "r_x3": 308.862, "r_y3": 461.553, "coord_origin": "TOPLEFT"}, "text": "undergoes a single forward pass through the", "orig": "undergoes a single forward pass through the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 183, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 498.078, "r_y0": 469.962, "r_x1": 545.111, "r_y1": 469.962, "r_x2": 545.111, "r_y2": 461.374, "r_x3": 498.078, "r_y3": 461.374, "coord_origin": "TOPLEFT"}, "text": "CNN Back-", "orig": "CNN Back-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 184, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 481.917, "r_x1": 364.443, "r_y1": 481.917, "r_x2": 364.443, "r_y2": 473.329, "r_x3": 308.862, "r_y3": 473.329, "coord_origin": "TOPLEFT"}, "text": "bone Network", "orig": "bone Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 185, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 367.061, "r_y0": 482.06, "r_x1": 545.113, "r_y1": 482.06, "r_x2": 545.113, "r_y2": 473.508, "r_x3": 367.061, "r_y3": 473.508, "coord_origin": "TOPLEFT"}, "text": "and transformer encoder. This eliminates the", "orig": "and transformer encoder. This eliminates the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 186, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 494.015, "r_x1": 545.115, "r_y1": 494.015, "r_x2": 545.115, "r_y2": 485.463, "r_x3": 308.862, "r_y3": 485.463, "coord_origin": "TOPLEFT"}, "text": "overhead of generating the same features for each decoding", "orig": "overhead of generating the same features for each decoding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 187, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 505.97, "r_x1": 545.115, "r_y1": 505.97, "r_x2": 545.115, "r_y2": 497.418, "r_x3": 308.862, "r_y3": 497.418, "coord_origin": "TOPLEFT"}, "text": "step. Similarly, we employ a 'caching' technique to preform", "orig": "step. Similarly, we employ a 'caching' technique to preform", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 188, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 517.9259999999999, "r_x1": 432.588, "r_y1": 517.9259999999999, "r_x2": 432.588, "r_y2": 509.374, "r_x3": 308.862, "r_y3": 509.374, "coord_origin": "TOPLEFT"}, "text": "faster autoregressive decoding.", "orig": "faster autoregressive decoding.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 189, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 436.732, "r_y0": 517.9259999999999, "r_x1": 545.115, "r_y1": 517.9259999999999, "r_x2": 545.115, "r_y2": 509.374, "r_x3": 436.732, "r_y3": 509.374, "coord_origin": "TOPLEFT"}, "text": "This is achieved by storing", "orig": "This is achieved by storing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 190, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 529.881, "r_x1": 545.115, "r_y1": 529.881, "r_x2": 545.115, "r_y2": 521.329, "r_x3": 308.862, "r_y3": 521.329, "coord_origin": "TOPLEFT"}, "text": "the features of decoded tokens so we can reuse them for", "orig": "the features of decoded tokens so we can reuse them for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 191, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 541.836, "r_x1": 370.062, "r_y1": 541.836, "r_x2": 370.062, "r_y2": 533.284, "r_x3": 308.862, "r_y3": 533.284, "coord_origin": "TOPLEFT"}, "text": "each time step.", "orig": "each time step.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 192, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 375.721, "r_y0": 541.836, "r_x1": 545.115, "r_y1": 541.836, "r_x2": 545.115, "r_y2": 533.284, "r_x3": 375.721, "r_y3": 533.284, "coord_origin": "TOPLEFT"}, "text": "Therefore, we only compute the attention", "orig": "Therefore, we only compute the attention", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 193, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 553.7909999999999, "r_x1": 377.215, "r_y1": 553.7909999999999, "r_x2": 377.215, "r_y2": 545.239, "r_x3": 308.862, "r_y3": 545.239, "coord_origin": "TOPLEFT"}, "text": "for each new tag.", "orig": "for each new tag.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 14, "label": "section_header", "bbox": {"l": 308.862, "t": 579.554, "r": 397.443, "b": 589.406, "coord_origin": "TOPLEFT"}, "confidence": 0.9450808763504028, "cells": [{"index": 194, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 589.406, "r_x1": 397.443, "r_y1": 589.406, "r_x2": 397.443, "r_y2": 579.554, "r_x3": 308.862, "r_y3": 579.554, "coord_origin": "TOPLEFT"}, "text": "5.2. Generalization", "orig": "5.2. Generalization", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 2, "label": "text", "bbox": {"l": 308.862, "t": 603.718, "r": 545.115, "b": 672.046, "coord_origin": "TOPLEFT"}, "confidence": 0.9880595803260803, "cells": [{"index": 195, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 612.27, "r_x1": 545.115, "r_y1": 612.27, "r_x2": 545.115, "r_y2": 603.718, "r_x3": 320.817, "r_y3": 603.718, "coord_origin": "TOPLEFT"}, "text": "TableFormer is evaluated on three major publicly avail-", "orig": "TableFormer is evaluated on three major publicly avail-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 196, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 624.225, "r_x1": 545.115, "r_y1": 624.225, "r_x2": 545.115, "r_y2": 615.673, "r_x3": 308.862, "r_y3": 615.673, "coord_origin": "TOPLEFT"}, "text": "able datasets of different nature to prove the generalization", "orig": "able datasets of different nature to prove the generalization", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 197, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 636.1800000000001, "r_x1": 545.115, "r_y1": 636.1800000000001, "r_x2": 545.115, "r_y2": 627.6279999999999, "r_x3": 308.862, "r_y3": 627.6279999999999, "coord_origin": "TOPLEFT"}, "text": "and effectiveness of our model. The datasets used for eval-", "orig": "and effectiveness of our model. The datasets used for eval-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 198, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 648.135, "r_x1": 545.115, "r_y1": 648.135, "r_x2": 545.115, "r_y2": 639.583, "r_x3": 308.862, "r_y3": 639.583, "coord_origin": "TOPLEFT"}, "text": "uation are the PubTabNet, FinTabNet and TableBank which", "orig": "uation are the PubTabNet, FinTabNet and TableBank which", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 199, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 660.091, "r_x1": 545.115, "r_y1": 660.091, "r_x2": 545.115, "r_y2": 651.539, "r_x3": 308.862, "r_y3": 651.539, "coord_origin": "TOPLEFT"}, "text": "stem from the scientific, financial and general domains re-", "orig": "stem from the scientific, financial and general domains re-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 200, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 672.046, "r_x1": 350.705, "r_y1": 672.046, "r_x2": 350.705, "r_y2": 663.494, "r_x3": 308.862, "r_y3": 663.494, "coord_origin": "TOPLEFT"}, "text": "spectively.", "orig": "spectively.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 8, "label": "text", "bbox": {"l": 308.862, "t": 680.604, "r": 545.115, "b": 713.067, "coord_origin": "TOPLEFT"}, "confidence": 0.9830910563468933, "cells": [{"index": 201, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 689.156, "r_x1": 545.115, "r_y1": 689.156, "r_x2": 545.115, "r_y2": 680.604, "r_x3": 320.817, "r_y3": 680.604, "coord_origin": "TOPLEFT"}, "text": "We also share our baseline results on the challenging", "orig": "We also share our baseline results on the challenging", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 202, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 701.111, "r_x1": 361.196, "r_y1": 701.111, "r_x2": 361.196, "r_y2": 692.559, "r_x3": 308.862, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "SynthTabNet", "orig": "SynthTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 203, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 366.057, "r_y0": 701.111, "r_x1": 396.214, "r_y1": 701.111, "r_x2": 396.214, "r_y2": 692.559, "r_x3": 366.057, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "dataset.", "orig": "dataset.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 204, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 406.406, "r_y0": 701.111, "r_x1": 453.449, "r_y1": 701.111, "r_x2": 453.449, "r_y2": 692.559, "r_x3": 406.406, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "Throughout", "orig": "Throughout", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 205, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 458.311, "r_y0": 701.111, "r_x1": 471.591, "r_y1": 701.111, "r_x2": 471.591, "r_y2": 692.559, "r_x3": 458.311, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "our", "orig": "our", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 206, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 476.453, "r_y0": 701.111, "r_x1": 527.481, "r_y1": 701.111, "r_x2": 527.481, "r_y2": 692.559, "r_x3": 476.453, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "experiments,", "orig": "experiments,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 207, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 532.941, "r_y0": 701.111, "r_x1": 545.115, "r_y1": 701.111, "r_x2": 545.115, "r_y2": 692.559, "r_x3": 532.941, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 208, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 713.067, "r_x1": 495.94, "r_y1": 713.067, "r_x2": 495.94, "r_y2": 704.515, "r_x3": 308.862, "r_y3": 704.515, "coord_origin": "TOPLEFT"}, "text": "same parameters stated in Sec. 5.1 are utilized.", "orig": "same parameters stated in Sec. 5.1 are utilized.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 17, "label": "page_footer", "bbox": {"l": 295.121, "t": 734.402, "r": 300.102, "b": 742.954, "coord_origin": "TOPLEFT"}, "confidence": 0.8820409178733826, "cells": [{"index": 209, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 295.121, "r_y0": 742.954, "r_x1": 300.102, "r_y1": 742.954, "r_x2": 300.102, "r_y2": 734.402, "r_x3": 295.121, "r_y3": 734.402, "coord_origin": "TOPLEFT"}, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}]}, "tablestructure": {"table_map": {}}, "figures_classification": null, "equations_prediction": null, "vlm_response": null}, "assembled": {"elements": [{"label": "text", "id": 5, "page_no": 5, "cluster": {"id": 5, "label": "text", "bbox": {"l": 50.112, "t": 75.47699999999998, "r": 286.365, "b": 155.76, "coord_origin": "TOPLEFT"}, "confidence": 0.9868090152740479, "cells": [{"index": 0, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 84.029, "r_x1": 286.365, "r_y1": 84.029, "r_x2": 286.365, "r_y2": 75.47699999999998, "r_x3": 50.112, "r_y3": 75.47699999999998, "coord_origin": "TOPLEFT"}, "text": "tention encoding is then multiplied to the encoded image to", "orig": "tention encoding is then multiplied to the encoded image to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 95.98400000000004, "r_x1": 286.365, "r_y1": 95.98400000000004, "r_x2": 286.365, "r_y2": 87.43200000000002, "r_x3": 50.112, "r_y3": 87.43200000000002, "coord_origin": "TOPLEFT"}, "text": "produce a feature for each table cell. Notice that this is dif-", "orig": "produce a feature for each table cell. Notice that this is dif-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 107.93899999999996, "r_x1": 286.365, "r_y1": 107.93899999999996, "r_x2": 286.365, "r_y2": 99.38699999999994, "r_x3": 50.112, "r_y3": 99.38699999999994, "coord_origin": "TOPLEFT"}, "text": "ferent than the typical object detection problem where im-", "orig": "ferent than the typical object detection problem where im-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 119.894, "r_x1": 286.365, "r_y1": 119.894, "r_x2": 286.365, "r_y2": 111.34199999999998, "r_x3": 50.112, "r_y3": 111.34199999999998, "coord_origin": "TOPLEFT"}, "text": "balances between the number of detections and the amount", "orig": "balances between the number of detections and the amount", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 131.84900000000005, "r_x1": 135.691, "r_y1": 131.84900000000005, "r_x2": 135.691, "r_y2": 123.29700000000003, "r_x3": 50.112, "r_y3": 123.29700000000003, "coord_origin": "TOPLEFT"}, "text": "of objects may exist.", "orig": "of objects may exist.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 142.047, "r_y0": 131.84900000000005, "r_x1": 286.365, "r_y1": 131.84900000000005, "r_x2": 286.365, "r_y2": 123.29700000000003, "r_x3": 142.047, "r_y3": 123.29700000000003, "coord_origin": "TOPLEFT"}, "text": "In our case, we know up front that", "orig": "In our case, we know up front that", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 143.80499999999995, "r_x1": 286.365, "r_y1": 143.80499999999995, "r_x2": 286.365, "r_y2": 135.25300000000004, "r_x3": 50.112, "r_y3": 135.25300000000004, "coord_origin": "TOPLEFT"}, "text": "the produced detections always match with the table cells", "orig": "the produced detections always match with the table cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 155.76, "r_x1": 175.163, "r_y1": 155.76, "r_x2": 175.163, "r_y2": 147.20799999999997, "r_x3": 50.112, "r_y3": 147.20799999999997, "coord_origin": "TOPLEFT"}, "text": "in number and correspondence.", "orig": "in number and correspondence.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "tention encoding is then multiplied to the encoded image to produce a feature for each table cell. Notice that this is different than the typical object detection problem where imbalances between the number of detections and the amount of objects may exist. In our case, we know up front that the produced detections always match with the table cells in number and correspondence."}, {"label": "text", "id": 6, "page_no": 5, "cluster": {"id": 6, "label": "text", "bbox": {"l": 50.112, "t": 159.89300000000003, "r": 286.365, "b": 240.17700000000002, "coord_origin": "TOPLEFT"}, "confidence": 0.9860327839851379, "cells": [{"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 168.44500000000005, "r_x1": 108.154, "r_y1": 168.44500000000005, "r_x2": 108.154, "r_y2": 159.89300000000003, "r_x3": 62.067, "r_y3": 159.89300000000003, "coord_origin": "TOPLEFT"}, "text": "The output", "orig": "The output", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 113.275, "r_y0": 168.44500000000005, "r_x1": 144.806, "r_y1": 168.44500000000005, "r_x2": 144.806, "r_y2": 159.89300000000003, "r_x3": 113.275, "r_y3": 159.89300000000003, "coord_origin": "TOPLEFT"}, "text": "features", "orig": "features", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 149.937, "r_y0": 168.44500000000005, "r_x1": 161.554, "r_y1": 168.44500000000005, "r_x2": 161.554, "r_y2": 159.89300000000003, "r_x3": 149.937, "r_y3": 159.89300000000003, "coord_origin": "TOPLEFT"}, "text": "for", "orig": "for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 166.684, "r_y0": 168.44500000000005, "r_x1": 184.936, "r_y1": 168.44500000000005, "r_x2": 184.936, "r_y2": 159.89300000000003, "r_x3": 166.684, "r_y3": 159.89300000000003, "coord_origin": "TOPLEFT"}, "text": "each", "orig": "each", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 190.057, "r_y0": 168.44500000000005, "r_x1": 209.424, "r_y1": 168.44500000000005, "r_x2": 209.424, "r_y2": 159.89300000000003, "r_x3": 190.057, "r_y3": 159.89300000000003, "coord_origin": "TOPLEFT"}, "text": "table", "orig": "table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 214.555, "r_y0": 168.44500000000005, "r_x1": 228.941, "r_y1": 168.44500000000005, "r_x2": 228.941, "r_y2": 159.89300000000003, "r_x3": 214.555, "r_y3": 159.89300000000003, "coord_origin": "TOPLEFT"}, "text": "cell", "orig": "cell", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 234.061, "r_y0": 168.44500000000005, "r_x1": 246.226, "r_y1": 168.44500000000005, "r_x2": 246.226, "r_y2": 159.89300000000003, "r_x3": 234.061, "r_y3": 159.89300000000003, "coord_origin": "TOPLEFT"}, "text": "are", "orig": "are", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 251.356, "r_y0": 168.44500000000005, "r_x1": 268.512, "r_y1": 168.44500000000005, "r_x2": 268.512, "r_y2": 159.89300000000003, "r_x3": 251.356, "r_y3": 159.89300000000003, "coord_origin": "TOPLEFT"}, "text": "then", "orig": "then", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 273.643, "r_y0": 168.44500000000005, "r_x1": 286.365, "r_y1": 168.44500000000005, "r_x2": 286.365, "r_y2": 159.89300000000003, "r_x3": 273.643, "r_y3": 159.89300000000003, "coord_origin": "TOPLEFT"}, "text": "fed", "orig": "fed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 180.40099999999995, "r_x1": 65.614, "r_y1": 180.40099999999995, "r_x2": 65.614, "r_y2": 171.84900000000005, "r_x3": 50.112, "r_y3": 171.84900000000005, "coord_origin": "TOPLEFT"}, "text": "into", "orig": "into", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.107, "r_y0": 180.40099999999995, "r_x1": 82.281, "r_y1": 180.40099999999995, "r_x2": 82.281, "r_y2": 171.84900000000005, "r_x3": 70.107, "r_y3": 171.84900000000005, "coord_origin": "TOPLEFT"}, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 19, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 86.764, "r_y0": 180.40099999999995, "r_x1": 138.66, "r_y1": 180.40099999999995, "r_x2": 138.66, "r_y2": 171.84900000000005, "r_x3": 86.764, "r_y3": 171.84900000000005, "coord_origin": "TOPLEFT"}, "text": "feed-forward", "orig": "feed-forward", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 20, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 143.153, "r_y0": 180.40099999999995, "r_x1": 286.365, "r_y1": 180.40099999999995, "r_x2": 286.365, "r_y2": 171.84900000000005, "r_x3": 143.153, "r_y3": 171.84900000000005, "coord_origin": "TOPLEFT"}, "text": "network (FFN). The FFN consists", "orig": "network (FFN). The FFN consists", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 21, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 192.356, "r_x1": 286.365, "r_y1": 192.356, "r_x2": 286.365, "r_y2": 183.80399999999997, "r_x3": 50.112, "r_y3": 183.80399999999997, "coord_origin": "TOPLEFT"}, "text": "of a Multi-Layer Perceptron (3 layers with ReLU activa-", "orig": "of a Multi-Layer Perceptron (3 layers with ReLU activa-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 22, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 204.31100000000004, "r_x1": 286.365, "r_y1": 204.31100000000004, "r_x2": 286.365, "r_y2": 195.75900000000001, "r_x3": 50.112, "r_y3": 195.75900000000001, "coord_origin": "TOPLEFT"}, "text": "tion function) that predicts the normalized coordinates for", "orig": "tion function) that predicts the normalized coordinates for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 23, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 216.26599999999996, "r_x1": 196.004, "r_y1": 216.26599999999996, "r_x2": 196.004, "r_y2": 207.71400000000006, "r_x3": 50.112, "r_y3": 207.71400000000006, "coord_origin": "TOPLEFT"}, "text": "the bounding box of each table cell.", "orig": "the bounding box of each table cell.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 24, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 200.786, "r_y0": 216.26599999999996, "r_x1": 286.365, "r_y1": 216.26599999999996, "r_x2": 286.365, "r_y2": 207.71400000000006, "r_x3": 200.786, "r_y3": 207.71400000000006, "coord_origin": "TOPLEFT"}, "text": "Finally, the predicted", "orig": "Finally, the predicted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 25, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 228.221, "r_x1": 286.365, "r_y1": 228.221, "r_x2": 286.365, "r_y2": 219.66899999999998, "r_x3": 50.112, "r_y3": 219.66899999999998, "coord_origin": "TOPLEFT"}, "text": "bounding boxes are classified based on whether they are", "orig": "bounding boxes are classified based on whether they are", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 26, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 240.17700000000002, "r_x1": 181.549, "r_y1": 240.17700000000002, "r_x2": 181.549, "r_y2": 231.625, "r_x3": 50.112, "r_y3": 231.625, "coord_origin": "TOPLEFT"}, "text": "empty or not using a linear layer.", "orig": "empty or not using a linear layer.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "The output features for each table cell are then fed into the feed-forward network (FFN). The FFN consists of a Multi-Layer Perceptron (3 layers with ReLU activation function) that predicts the normalized coordinates for the bounding box of each table cell. Finally, the predicted bounding boxes are classified based on whether they are empty or not using a linear layer."}, {"label": "text", "id": 4, "page_no": 5, "cluster": {"id": 4, "label": "text", "bbox": {"l": 50.112, "t": 243.92200000000003, "r": 286.366, "b": 444.145, "coord_origin": "TOPLEFT"}, "confidence": 0.9873637557029724, "cells": [{"index": 27, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 252.87800000000004, "r_x1": 129.215, "r_y1": 252.87800000000004, "r_x2": 129.215, "r_y2": 243.92200000000003, "r_x3": 62.067, "r_y3": 243.92200000000003, "coord_origin": "TOPLEFT"}, "text": "Loss Functions.", "orig": "Loss Functions.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 28, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.451, "r_y0": 252.86199999999997, "r_x1": 276.139, "r_y1": 252.86199999999997, "r_x2": 276.139, "r_y2": 244.30999999999995, "r_x3": 134.451, "r_y3": 244.30999999999995, "coord_origin": "TOPLEFT"}, "text": "We formulate a multi-task loss Eq.", "orig": "We formulate a multi-task loss Eq.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 29, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 281.379, "r_y0": 252.86199999999997, "r_x1": 286.361, "r_y1": 252.86199999999997, "r_x2": 286.361, "r_y2": 244.30999999999995, "r_x3": 281.379, "r_y3": 244.30999999999995, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 30, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 264.817, "r_x1": 134.685, "r_y1": 264.817, "r_x2": 134.685, "r_y2": 256.265, "r_x3": 50.112, "r_y3": 256.265, "coord_origin": "TOPLEFT"}, "text": "to train our network.", "orig": "to train our network.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 140.543, "r_y0": 264.817, "r_x1": 286.365, "r_y1": 264.817, "r_x2": 286.365, "r_y2": 256.265, "r_x3": 140.543, "r_y3": 256.265, "coord_origin": "TOPLEFT"}, "text": "The Cross-Entropy loss (denoted as", "orig": "The Cross-Entropy loss (denoted as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 276.60900000000004, "r_x1": 53.085, "r_y1": 276.60900000000004, "r_x2": 53.085, "r_y2": 267.903, "r_x3": 50.112, "r_y3": 267.903, "coord_origin": "TOPLEFT"}, "text": "l", "orig": "l", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 53.085, "r_y0": 277.53200000000004, "r_x1": 56.845, "r_y1": 277.53200000000004, "r_x2": 56.845, "r_y2": 271.438, "r_x3": 53.085, "r_y3": 271.438, "coord_origin": "TOPLEFT"}, "text": "s", "orig": "s", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 57.343, "r_y0": 276.773, "r_x1": 135.4, "r_y1": 276.773, "r_x2": 135.4, "r_y2": 268.221, "r_x3": 57.343, "r_y3": 268.221, "coord_origin": "TOPLEFT"}, "text": ") is used to train the", "orig": ") is used to train the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 137.735, "r_y0": 276.63, "r_x1": 211.08, "r_y1": 276.63, "r_x2": 211.08, "r_y2": 268.04200000000003, "r_x3": 137.735, "r_y3": 268.04200000000003, "coord_origin": "TOPLEFT"}, "text": "Structure Decoder", "orig": "Structure Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 213.637, "r_y0": 276.773, "r_x1": 286.364, "r_y1": 276.773, "r_x2": 286.364, "r_y2": 268.221, "r_x3": 213.637, "r_y3": 268.221, "coord_origin": "TOPLEFT"}, "text": "which predicts the", "orig": "which predicts the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 288.728, "r_x1": 158.824, "r_y1": 288.728, "r_x2": 158.824, "r_y2": 280.176, "r_x3": 50.112, "r_y3": 280.176, "coord_origin": "TOPLEFT"}, "text": "structure tokens. As for the", "orig": "structure tokens. As for the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 161.318, "r_y0": 288.585, "r_x1": 238.797, "r_y1": 288.585, "r_x2": 238.797, "r_y2": 279.99699999999996, "r_x3": 161.318, "r_y3": 279.99699999999996, "coord_origin": "TOPLEFT"}, "text": "Cell BBox Decoder", "orig": "Cell BBox Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 241.521, "r_y0": 288.728, "r_x1": 286.363, "r_y1": 288.728, "r_x2": 286.363, "r_y2": 280.176, "r_x3": 241.521, "r_y3": 280.176, "coord_origin": "TOPLEFT"}, "text": "it is trained", "orig": "it is trained", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 300.683, "r_x1": 211.377, "r_y1": 300.683, "r_x2": 211.377, "r_y2": 292.131, "r_x3": 50.112, "r_y3": 292.131, "coord_origin": "TOPLEFT"}, "text": "with a combination of losses denoted as", "orig": "with a combination of losses denoted as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 214.271, "r_y0": 300.519, "r_x1": 217.244, "r_y1": 300.519, "r_x2": 217.244, "r_y2": 291.813, "r_x3": 214.271, "r_y3": 291.813, "coord_origin": "TOPLEFT"}, "text": "l", "orig": "l", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 217.244, "r_y0": 301.442, "r_x1": 229.198, "r_y1": 301.442, "r_x2": 229.198, "r_y2": 295.348, "r_x3": 217.244, "r_y3": 295.348, "coord_origin": "TOPLEFT"}, "text": "box", "orig": "box", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 229.696, "r_y0": 300.683, "r_x1": 232.187, "r_y1": 300.683, "r_x2": 232.187, "r_y2": 292.131, "r_x3": 229.696, "r_y3": 292.131, "coord_origin": "TOPLEFT"}, "text": ".", "orig": ".", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 236.49, "r_y0": 300.519, "r_x1": 239.463, "r_y1": 300.519, "r_x2": 239.463, "r_y2": 291.813, "r_x3": 236.49, "r_y3": 291.813, "coord_origin": "TOPLEFT"}, "text": "l", "orig": "l", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 239.463, "r_y0": 301.442, "r_x1": 251.417, "r_y1": 301.442, "r_x2": 251.417, "r_y2": 295.348, "r_x3": 239.463, "r_y3": 295.348, "coord_origin": "TOPLEFT"}, "text": "box", "orig": "box", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 254.811, "r_y0": 300.683, "r_x1": 286.363, "r_y1": 300.683, "r_x2": 286.363, "r_y2": 292.131, "r_x3": 254.811, "r_y3": 292.131, "coord_origin": "TOPLEFT"}, "text": "consists", "orig": "consists", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 312.638, "r_x1": 137.454, "r_y1": 312.638, "r_x2": 137.454, "r_y2": 304.086, "r_x3": 50.112, "r_y3": 304.086, "coord_origin": "TOPLEFT"}, "text": "of the generally used", "orig": "of the generally used", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 48, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 141.298, "r_y0": 312.474, "r_x1": 144.271, "r_y1": 312.474, "r_x2": 144.271, "r_y2": 303.768, "r_x3": 141.298, "r_y3": 303.768, "coord_origin": "TOPLEFT"}, "text": "l", "orig": "l", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 49, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 144.271, "r_y0": 313.398, "r_x1": 148.243, "r_y1": 313.398, "r_x2": 148.243, "r_y2": 307.304, "r_x3": 144.271, "r_y3": 307.304, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 50, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 152.586, "r_y0": 312.638, "r_x1": 286.364, "r_y1": 312.638, "r_x2": 286.364, "r_y2": 304.086, "r_x3": 152.586, "r_y3": 304.086, "coord_origin": "TOPLEFT"}, "text": "loss for object detection and the", "orig": "loss for object detection and the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 51, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 324.593, "r_x1": 89.683, "r_y1": 324.593, "r_x2": 89.683, "r_y2": 316.041, "r_x3": 50.112, "r_y3": 316.041, "coord_origin": "TOPLEFT"}, "text": "IoU loss (", "orig": "IoU loss (", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 52, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 89.686, "r_y0": 324.429, "r_x1": 92.659, "r_y1": 324.429, "r_x2": 92.659, "r_y2": 315.723, "r_x3": 89.686, "r_y3": 315.723, "coord_origin": "TOPLEFT"}, "text": "l", "orig": "l", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 53, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 92.659, "r_y0": 325.353, "r_x1": 104.12, "r_y1": 325.353, "r_x2": 104.12, "r_y2": 319.259, "r_x3": 92.659, "r_y3": 319.259, "coord_origin": "TOPLEFT"}, "text": "iou", "orig": "iou", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 54, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 104.618, "r_y0": 324.593, "r_x1": 286.366, "r_y1": 324.593, "r_x2": 286.366, "r_y2": 316.041, "r_x3": 104.618, "r_y3": 316.041, "coord_origin": "TOPLEFT"}, "text": ") to be scale invariant as explained in [25]. In", "orig": ") to be scale invariant as explained in [25]. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 55, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 336.549, "r_x1": 286.365, "r_y1": 336.549, "r_x2": 286.365, "r_y2": 327.997, "r_x3": 50.112, "r_y3": 327.997, "coord_origin": "TOPLEFT"}, "text": "comparison to DETR, we do not use the Hungarian algo-", "orig": "comparison to DETR, we do not use the Hungarian algo-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 56, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 348.504, "r_x1": 286.365, "r_y1": 348.504, "r_x2": 286.365, "r_y2": 339.952, "r_x3": 50.112, "r_y3": 339.952, "coord_origin": "TOPLEFT"}, "text": "rithm [15] to match the predicted bounding boxes with the", "orig": "rithm [15] to match the predicted bounding boxes with the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 57, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 360.459, "r_x1": 286.365, "r_y1": 360.459, "r_x2": 286.365, "r_y2": 351.907, "r_x3": 50.112, "r_y3": 351.907, "coord_origin": "TOPLEFT"}, "text": "ground-truth boxes, as we have already achieved a one-to-", "orig": "ground-truth boxes, as we have already achieved a one-to-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 58, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 372.414, "r_x1": 286.365, "r_y1": 372.414, "r_x2": 286.365, "r_y2": 363.862, "r_x3": 50.112, "r_y3": 363.862, "coord_origin": "TOPLEFT"}, "text": "one match through two steps: 1) Our token input sequence", "orig": "one match through two steps: 1) Our token input sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 59, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 384.369, "r_x1": 286.365, "r_y1": 384.369, "r_x2": 286.365, "r_y2": 375.817, "r_x3": 50.112, "r_y3": 375.817, "coord_origin": "TOPLEFT"}, "text": "is naturally ordered, therefore the hidden states of the table", "orig": "is naturally ordered, therefore the hidden states of the table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 60, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 396.324, "r_x1": 286.365, "r_y1": 396.324, "r_x2": 286.365, "r_y2": 387.772, "r_x3": 50.112, "r_y3": 387.772, "coord_origin": "TOPLEFT"}, "text": "data cells are also in order when they are provided as in-", "orig": "data cells are also in order when they are provided as in-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 61, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 408.28, "r_x1": 88.687, "r_y1": 408.28, "r_x2": 88.687, "r_y2": 399.728, "r_x3": 50.112, "r_y3": 399.728, "coord_origin": "TOPLEFT"}, "text": "put to the", "orig": "put to the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 62, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 91.646, "r_y0": 408.137, "r_x1": 170.052, "r_y1": 408.137, "r_x2": 170.052, "r_y2": 399.549, "r_x3": 91.646, "r_y3": 399.549, "coord_origin": "TOPLEFT"}, "text": "Cell BBox Decoder", "orig": "Cell BBox Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 63, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 170.051, "r_y0": 408.28, "r_x1": 172.542, "r_y1": 408.28, "r_x2": 172.542, "r_y2": 399.728, "r_x3": 170.051, "r_y3": 399.728, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 64, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 175.62, "r_y0": 408.28, "r_x1": 286.364, "r_y1": 408.28, "r_x2": 286.364, "r_y2": 399.728, "r_x3": 175.62, "r_y3": 399.728, "coord_origin": "TOPLEFT"}, "text": "and 2) Our bounding boxes", "orig": "and 2) Our bounding boxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 65, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 420.235, "r_x1": 181.967, "r_y1": 420.235, "r_x2": 181.967, "r_y2": 411.683, "r_x3": 50.112, "r_y3": 411.683, "coord_origin": "TOPLEFT"}, "text": "generation mechanism (see Sec.", "orig": "generation mechanism (see Sec.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 66, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 189.09, "r_y0": 420.235, "r_x1": 286.365, "r_y1": 420.235, "r_x2": 286.365, "r_y2": 411.683, "r_x3": 189.09, "r_y3": 411.683, "coord_origin": "TOPLEFT"}, "text": "3) ensures a one-to-one", "orig": "3) ensures a one-to-one", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 67, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 432.19, "r_x1": 286.365, "r_y1": 432.19, "r_x2": 286.365, "r_y2": 423.638, "r_x3": 50.112, "r_y3": 423.638, "coord_origin": "TOPLEFT"}, "text": "mapping between the cell content and its bounding box for", "orig": "mapping between the cell content and its bounding box for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 68, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 444.145, "r_x1": 158.296, "r_y1": 444.145, "r_x2": 158.296, "r_y2": 435.593, "r_x3": 50.112, "r_y3": 435.593, "coord_origin": "TOPLEFT"}, "text": "all post-processed datasets.", "orig": "all post-processed datasets.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Loss Functions. We formulate a multi-task loss Eq. 2 to train our network. The Cross-Entropy loss (denoted as l s ) is used to train the Structure Decoder which predicts the structure tokens. As for the Cell BBox Decoder it is trained with a combination of losses denoted as l box . l box consists of the generally used l 1 loss for object detection and the IoU loss ( l iou ) to be scale invariant as explained in [25]. In comparison to DETR, we do not use the Hungarian algorithm [15] to match the predicted bounding boxes with the ground-truth boxes, as we have already achieved a one-toone match through two steps: 1) Our token input sequence is naturally ordered, therefore the hidden states of the table data cells are also in order when they are provided as input to the Cell BBox Decoder , and 2) Our bounding boxes generation mechanism (see Sec. 3) ensures a one-to-one mapping between the cell content and its bounding box for all post-processed datasets."}, {"label": "text", "id": 11, "page_no": 5, "cluster": {"id": 11, "label": "text", "bbox": {"l": 50.112, "t": 448.279, "r": 286.365, "b": 468.786, "coord_origin": "TOPLEFT"}, "confidence": 0.9724196195602417, "cells": [{"index": 69, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 456.831, "r_x1": 286.365, "r_y1": 456.831, "r_x2": 286.365, "r_y2": 448.279, "r_x3": 62.067, "r_y3": 448.279, "coord_origin": "TOPLEFT"}, "text": "The loss used to train the TableFormer can be defined as", "orig": "The loss used to train the TableFormer can be defined as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 70, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 468.786, "r_x1": 91.377, "r_y1": 468.786, "r_x2": 91.377, "r_y2": 460.234, "r_x3": 50.112, "r_y3": 460.234, "coord_origin": "TOPLEFT"}, "text": "following:", "orig": "following:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "The loss used to train the TableFormer can be defined as following:"}, {"label": "formula", "id": 15, "page_no": 5, "cluster": {"id": 15, "label": "formula", "bbox": {"l": 124.33, "t": 493.391, "r": 286.362, "b": 517.9639999999999, "coord_origin": "TOPLEFT"}, "confidence": 0.9423348307609558, "cells": [{"index": 71, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 125.715, "r_y0": 502.097, "r_x1": 128.688, "r_y1": 502.097, "r_x2": 128.688, "r_y2": 493.391, "r_x3": 125.715, "r_y3": 493.391, "coord_origin": "TOPLEFT"}, "text": "l", "orig": "l", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 72, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 128.688, "r_y0": 503.02, "r_x1": 140.642, "r_y1": 503.02, "r_x2": 140.642, "r_y2": 496.926, "r_x3": 128.688, "r_y3": 496.926, "coord_origin": "TOPLEFT"}, "text": "box", "orig": "box", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 73, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 143.907, "r_y0": 502.097, "r_x1": 151.656, "r_y1": 502.097, "r_x2": 151.656, "r_y2": 493.391, "r_x3": 143.907, "r_y3": 493.391, "coord_origin": "TOPLEFT"}, "text": "=", "orig": "=", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 74, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 154.423, "r_y0": 502.097, "r_x1": 160.234, "r_y1": 502.097, "r_x2": 160.234, "r_y2": 493.391, "r_x3": 154.423, "r_y3": 493.391, "coord_origin": "TOPLEFT"}, "text": "\u03bb", "orig": "\u03bb", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 75, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.235, "r_y0": 503.02, "r_x1": 186.628, "r_y1": 503.02, "r_x2": 186.628, "r_y2": 496.926, "r_x3": 160.235, "r_y3": 496.926, "coord_origin": "TOPLEFT"}, "text": "iou iou", "orig": "iou iou", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 76, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 172.194, "r_y0": 502.097, "r_x1": 175.167, "r_y1": 502.097, "r_x2": 175.167, "r_y2": 493.391, "r_x3": 172.194, "r_y3": 493.391, "coord_origin": "TOPLEFT"}, "text": "l", "orig": "l", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 77, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 189.34, "r_y0": 502.097, "r_x1": 197.089, "r_y1": 502.097, "r_x2": 197.089, "r_y2": 493.391, "r_x3": 189.34, "r_y3": 493.391, "coord_origin": "TOPLEFT"}, "text": "+", "orig": "+", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 78, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 199.303, "r_y0": 502.097, "r_x1": 205.114, "r_y1": 502.097, "r_x2": 205.114, "r_y2": 493.391, "r_x3": 199.303, "r_y3": 493.391, "coord_origin": "TOPLEFT"}, "text": "\u03bb", "orig": "\u03bb", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 79, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 205.115, "r_y0": 503.02, "r_x1": 207.635, "r_y1": 503.02, "r_x2": 207.635, "r_y2": 496.926, "r_x3": 205.115, "r_y3": 496.926, "coord_origin": "TOPLEFT"}, "text": "l", "orig": "l", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 80, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 207.675, "r_y0": 503.02, "r_x1": 211.647, "r_y1": 503.02, "r_x2": 211.647, "r_y2": 496.926, "r_x3": 207.675, "r_y3": 496.926, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 81, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 124.33, "r_y0": 517.0409999999999, "r_x1": 127.303, "r_y1": 517.0409999999999, "r_x2": 127.303, "r_y2": 508.335, "r_x3": 124.33, "r_y3": 508.335, "coord_origin": "TOPLEFT"}, "text": "l", "orig": "l", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 82, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 130.266, "r_y0": 517.0409999999999, "r_x1": 138.015, "r_y1": 517.0409999999999, "r_x2": 138.015, "r_y2": 508.335, "r_x3": 130.266, "r_y3": 508.335, "coord_origin": "TOPLEFT"}, "text": "=", "orig": "=", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 83, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 140.782, "r_y0": 517.0409999999999, "r_x1": 149.566, "r_y1": 517.0409999999999, "r_x2": 149.566, "r_y2": 508.335, "r_x3": 140.782, "r_y3": 508.335, "coord_origin": "TOPLEFT"}, "text": "\u03bbl", "orig": "\u03bbl", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 84, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 149.566, "r_y0": 517.9639999999999, "r_x1": 153.326, "r_y1": 517.9639999999999, "r_x2": 153.326, "r_y2": 511.87, "r_x3": 149.566, "r_y3": 511.87, "coord_origin": "TOPLEFT"}, "text": "s", "orig": "s", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 85, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 156.039, "r_y0": 517.0409999999999, "r_x1": 174.855, "r_y1": 517.0409999999999, "r_x2": 174.855, "r_y2": 508.335, "r_x3": 156.039, "r_y3": 508.335, "coord_origin": "TOPLEFT"}, "text": "+(1", "orig": "+(1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 86, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 177.071, "r_y0": 516.899, "r_x1": 184.82, "r_y1": 516.899, "r_x2": 184.82, "r_y2": 508.335, "r_x3": 177.071, "r_y3": 508.335, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 87, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 187.033, "r_y0": 517.0409999999999, "r_x1": 199.692, "r_y1": 517.0409999999999, "r_x2": 199.692, "r_y2": 508.335, "r_x3": 187.033, "r_y3": 508.335, "coord_origin": "TOPLEFT"}, "text": "\u03bb l", "orig": "\u03bb l", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 88, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 192.845, "r_y0": 517.0409999999999, "r_x1": 196.719, "r_y1": 517.0409999999999, "r_x2": 196.719, "r_y2": 508.335, "r_x3": 192.845, "r_y3": 508.335, "coord_origin": "TOPLEFT"}, "text": ")", "orig": ")", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 89, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 199.692, "r_y0": 517.9639999999999, "r_x1": 211.646, "r_y1": 517.9639999999999, "r_x2": 211.646, "r_y2": 511.87, "r_x3": 199.692, "r_y3": 511.87, "coord_origin": "TOPLEFT"}, "text": "box", "orig": "box", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 90, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 274.746, "r_y0": 509.832, "r_x1": 286.362, "r_y1": 509.832, "r_x2": 286.362, "r_y2": 501.28, "r_x3": 274.746, "r_y3": 501.28, "coord_origin": "TOPLEFT"}, "text": "(1)", "orig": "(1)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "l box = \u03bb iou iou l + \u03bb l 1 l = \u03bbl s +(1 -\u03bb l ) box (1)"}, {"label": "text", "id": 16, "page_no": 5, "cluster": {"id": 16, "label": "text", "bbox": {"l": 50.112, "t": 531.26, "r": 281.597, "b": 540.889, "coord_origin": "TOPLEFT"}, "confidence": 0.9363929629325867, "cells": [{"index": 91, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 540.13, "r_x1": 74.451, "r_y1": 540.13, "r_x2": 74.451, "r_y2": 531.578, "r_x3": 50.112, "r_y3": 531.578, "coord_origin": "TOPLEFT"}, "text": "where", "orig": "where", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 92, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 76.941, "r_y0": 539.966, "r_x1": 82.752, "r_y1": 539.966, "r_x2": 82.752, "r_y2": 531.26, "r_x3": 76.941, "r_y3": 531.26, "coord_origin": "TOPLEFT"}, "text": "\u03bb", "orig": "\u03bb", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 93, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 85.52, "r_y0": 539.8240000000001, "r_x1": 92.162, "r_y1": 539.8240000000001, "r_x2": 92.162, "r_y2": 531.26, "r_x3": 85.52, "r_y3": 531.26, "coord_origin": "TOPLEFT"}, "text": "\u2208", "orig": "\u2208", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 94, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 94.653, "r_y0": 540.13, "r_x1": 135.599, "r_y1": 540.13, "r_x2": 135.599, "r_y2": 531.578, "r_x3": 94.653, "r_y3": 531.578, "coord_origin": "TOPLEFT"}, "text": "[0, 1], and", "orig": "[0, 1], and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 95, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 138.09, "r_y0": 539.966, "r_x1": 143.901, "r_y1": 539.966, "r_x2": 143.901, "r_y2": 531.26, "r_x3": 138.09, "r_y3": 531.26, "coord_origin": "TOPLEFT"}, "text": "\u03bb", "orig": "\u03bb", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 96, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 143.901, "r_y0": 540.889, "r_x1": 155.362, "r_y1": 540.889, "r_x2": 155.362, "r_y2": 534.7950000000001, "r_x3": 143.901, "r_y3": 534.7950000000001, "coord_origin": "TOPLEFT"}, "text": "iou", "orig": "iou", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 97, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 155.861, "r_y0": 539.966, "r_x1": 166.104, "r_y1": 539.966, "r_x2": 166.104, "r_y2": 531.26, "r_x3": 155.861, "r_y3": 531.26, "coord_origin": "TOPLEFT"}, "text": ", \u03bb", "orig": ", \u03bb", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 98, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 166.1, "r_y0": 540.889, "r_x1": 168.62, "r_y1": 540.889, "r_x2": 168.62, "r_y2": 534.7950000000001, "r_x3": 166.1, "r_y3": 534.7950000000001, "coord_origin": "TOPLEFT"}, "text": "l", "orig": "l", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 99, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 168.66, "r_y0": 540.889, "r_x1": 172.632, "r_y1": 540.889, "r_x2": 172.632, "r_y2": 534.7950000000001, "r_x3": 168.66, "r_y3": 534.7950000000001, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 100, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 175.897, "r_y0": 539.8240000000001, "r_x1": 182.539, "r_y1": 539.8240000000001, "r_x2": 182.539, "r_y2": 531.26, "r_x3": 175.897, "r_y3": 531.26, "coord_origin": "TOPLEFT"}, "text": "\u2208", "orig": "\u2208", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 101, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 185.306, "r_y0": 538.064, "r_x1": 192.501, "r_y1": 538.064, "r_x2": 192.501, "r_y2": 533.441, "r_x3": 185.306, "r_y3": 533.441, "coord_origin": "TOPLEFT"}, "text": "R", "orig": "R", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 102, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 194.992, "r_y0": 540.13, "r_x1": 281.597, "r_y1": 540.13, "r_x2": 281.597, "r_y2": 531.578, "r_x3": 194.992, "r_y3": 531.578, "coord_origin": "TOPLEFT"}, "text": "are hyper-parameters.", "orig": "are hyper-parameters.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "where \u03bb \u2208 [0, 1], and \u03bb iou , \u03bb l 1 \u2208 R are hyper-parameters."}, {"label": "section_header", "id": 12, "page_no": 5, "cluster": {"id": 12, "label": "section_header", "bbox": {"l": 50.112, "t": 555.917, "r": 171.983, "b": 566.665, "coord_origin": "TOPLEFT"}, "confidence": 0.9554555416107178, "cells": [{"index": 103, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 566.665, "r_x1": 171.983, "r_y1": 566.665, "r_x2": 171.983, "r_y2": 555.917, "r_x3": 50.112, "r_y3": 555.917, "coord_origin": "TOPLEFT"}, "text": "5. Experimental Results", "orig": "5. Experimental Results", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "5. Experimental Results"}, {"label": "section_header", "id": 13, "page_no": 5, "cluster": {"id": 13, "label": "section_header", "bbox": {"l": 50.112, "t": 576.264, "r": 179.175, "b": 586.116, "coord_origin": "TOPLEFT"}, "confidence": 0.9538503289222717, "cells": [{"index": 104, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 586.116, "r_x1": 179.175, "r_y1": 586.116, "r_x2": 179.175, "r_y2": 576.264, "r_x3": 50.112, "r_y3": 576.264, "coord_origin": "TOPLEFT"}, "text": "5.1. Implementation Details", "orig": "5.1. Implementation Details", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "5.1. Implementation Details"}, {"label": "text", "id": 7, "page_no": 5, "cluster": {"id": 7, "label": "text", "bbox": {"l": 50.112, "t": 595.8240000000001, "r": 286.365, "b": 640.421, "coord_origin": "TOPLEFT"}, "confidence": 0.9856163263320923, "cells": [{"index": 105, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 604.5550000000001, "r_x1": 202.978, "r_y1": 604.5550000000001, "r_x2": 202.978, "r_y2": 596.0029999999999, "r_x3": 62.067, "r_y3": 596.0029999999999, "coord_origin": "TOPLEFT"}, "text": "TableFormer uses ResNet-18 as the", "orig": "TableFormer uses ResNet-18 as the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 106, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 205.384, "r_y0": 604.412, "r_x1": 286.36, "r_y1": 604.412, "r_x2": 286.36, "r_y2": 595.8240000000001, "r_x3": 205.384, "r_y3": 595.8240000000001, "coord_origin": "TOPLEFT"}, "text": "CNN Backbone Net-", "orig": "CNN Backbone Net-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 107, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 616.367, "r_x1": 70.037, "r_y1": 616.367, "r_x2": 70.037, "r_y2": 607.779, "r_x3": 50.112, "r_y3": 607.779, "coord_origin": "TOPLEFT"}, "text": "work", "orig": "work", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 108, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.037, "r_y0": 616.51, "r_x1": 72.528, "r_y1": 616.51, "r_x2": 72.528, "r_y2": 607.958, "r_x3": 70.037, "r_y3": 607.958, "coord_origin": "TOPLEFT"}, "text": ".", "orig": ".", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 109, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 77.14, "r_y0": 616.51, "r_x1": 286.365, "r_y1": 616.51, "r_x2": 286.365, "r_y2": 607.958, "r_x3": 77.14, "r_y3": 607.958, "coord_origin": "TOPLEFT"}, "text": "The input images are resized to 448*448 pixels and", "orig": "The input images are resized to 448*448 pixels and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 110, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 628.465, "r_x1": 286.365, "r_y1": 628.465, "r_x2": 286.365, "r_y2": 619.913, "r_x3": 50.112, "r_y3": 619.913, "coord_origin": "TOPLEFT"}, "text": "the feature map has a dimension of 28*28. Additionally, we", "orig": "the feature map has a dimension of 28*28. Additionally, we", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 111, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 640.421, "r_x1": 207.033, "r_y1": 640.421, "r_x2": 207.033, "r_y2": 631.869, "r_x3": 50.112, "r_y3": 631.869, "coord_origin": "TOPLEFT"}, "text": "enforce the following input constraints:", "orig": "enforce the following input constraints:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "TableFormer uses ResNet-18 as the CNN Backbone Network . The input images are resized to 448*448 pixels and the feature map has a dimension of 28*28. Additionally, we enforce the following input constraints:"}, {"label": "formula", "id": 18, "page_no": 5, "cluster": {"id": 18, "label": "formula", "bbox": {"l": 91.661, "t": 654.496, "r": 286.362, "b": 678.31, "coord_origin": "TOPLEFT"}, "confidence": 0.844183623790741, "cells": [{"index": 112, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 91.661, "r_y0": 663.366, "r_x1": 186.017, "r_y1": 663.366, "r_x2": 186.017, "r_y2": 654.814, "r_x3": 91.661, "r_y3": 654.814, "coord_origin": "TOPLEFT"}, "text": "Image width and height", "orig": "Image width and height", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 113, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 188.507, "r_y0": 663.06, "r_x1": 196.256, "r_y1": 663.06, "r_x2": 196.256, "r_y2": 654.496, "r_x3": 188.507, "r_y3": 654.496, "coord_origin": "TOPLEFT"}, "text": "\u2264", "orig": "\u2264", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 114, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 198.746, "r_y0": 663.366, "r_x1": 244.813, "r_y1": 663.366, "r_x2": 244.813, "r_y2": 654.814, "r_x3": 198.746, "r_y3": 654.814, "coord_origin": "TOPLEFT"}, "text": "1024 pixels", "orig": "1024 pixels", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 115, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 101.016, "r_y0": 678.31, "r_x1": 186.246, "r_y1": 678.31, "r_x2": 186.246, "r_y2": 669.758, "r_x3": 101.016, "r_y3": 669.758, "coord_origin": "TOPLEFT"}, "text": "Structural tags length", "orig": "Structural tags length", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 116, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 188.736, "r_y0": 678.004, "r_x1": 196.485, "r_y1": 678.004, "r_x2": 196.485, "r_y2": 669.44, "r_x3": 188.736, "r_y3": 669.44, "coord_origin": "TOPLEFT"}, "text": "\u2264", "orig": "\u2264", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 117, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 198.975, "r_y0": 678.31, "r_x1": 244.813, "r_y1": 678.31, "r_x2": 244.813, "r_y2": 669.758, "r_x3": 198.975, "r_y3": 669.758, "coord_origin": "TOPLEFT"}, "text": "512 tokens.", "orig": "512 tokens.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 118, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 274.746, "r_y0": 670.938, "r_x1": 286.362, "r_y1": 670.938, "r_x2": 286.362, "r_y2": 662.386, "r_x3": 274.746, "r_y3": 662.386, "coord_origin": "TOPLEFT"}, "text": "(2)", "orig": "(2)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Image width and height \u2264 1024 pixels Structural tags length \u2264 512 tokens. (2)"}, {"label": "text", "id": 10, "page_no": 5, "cluster": {"id": 10, "label": "text", "bbox": {"l": 50.112, "t": 692.559, "r": 286.365, "b": 713.066, "coord_origin": "TOPLEFT"}, "confidence": 0.9724979996681213, "cells": [{"index": 119, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 701.111, "r_x1": 286.365, "r_y1": 701.111, "r_x2": 286.365, "r_y2": 692.559, "r_x3": 50.112, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "Although input constraints are used also by other methods,", "orig": "Although input constraints are used also by other methods,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 120, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 713.066, "r_x1": 286.365, "r_y1": 713.066, "r_x2": 286.365, "r_y2": 704.514, "r_x3": 50.112, "r_y3": 704.514, "coord_origin": "TOPLEFT"}, "text": "such as EDD, ours are less restrictive due to the improved", "orig": "such as EDD, ours are less restrictive due to the improved", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Although input constraints are used also by other methods, such as EDD, ours are less restrictive due to the improved"}, {"label": "text", "id": 9, "page_no": 5, "cluster": {"id": 9, "label": "text", "bbox": {"l": 308.862, "t": 75.47699999999998, "r": 545.115, "b": 107.93899999999996, "coord_origin": "TOPLEFT"}, "confidence": 0.9799237847328186, "cells": [{"index": 121, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 84.029, "r_x1": 545.115, "r_y1": 84.029, "r_x2": 545.115, "r_y2": 75.47699999999998, "r_x3": 308.862, "r_y3": 75.47699999999998, "coord_origin": "TOPLEFT"}, "text": "runtime performance and lower memory footprint of Table-", "orig": "runtime performance and lower memory footprint of Table-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 122, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 95.98400000000004, "r_x1": 339.985, "r_y1": 95.98400000000004, "r_x2": 339.985, "r_y2": 87.43200000000002, "r_x3": 308.862, "r_y3": 87.43200000000002, "coord_origin": "TOPLEFT"}, "text": "Former.", "orig": "Former.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 123, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 346.889, "r_y0": 95.98400000000004, "r_x1": 545.115, "r_y1": 95.98400000000004, "r_x2": 545.115, "r_y2": 87.43200000000002, "r_x3": 346.889, "r_y3": 87.43200000000002, "coord_origin": "TOPLEFT"}, "text": "This allows to utilize input samples with longer", "orig": "This allows to utilize input samples with longer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 124, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 107.93899999999996, "r_x1": 492.961, "r_y1": 107.93899999999996, "r_x2": 492.961, "r_y2": 99.38699999999994, "r_x3": 308.862, "r_y3": 99.38699999999994, "coord_origin": "TOPLEFT"}, "text": "sequences and images with larger dimensions.", "orig": "sequences and images with larger dimensions.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "runtime performance and lower memory footprint of TableFormer. This allows to utilize input samples with longer sequences and images with larger dimensions."}, {"label": "text", "id": 1, "page_no": 5, "cluster": {"id": 1, "label": "text", "bbox": {"l": 308.862, "t": 116.49800000000005, "r": 545.115, "b": 328.288, "coord_origin": "TOPLEFT"}, "confidence": 0.9880930781364441, "cells": [{"index": 125, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 125.04999999999995, "r_x1": 545.115, "r_y1": 125.04999999999995, "r_x2": 545.115, "r_y2": 116.49800000000005, "r_x3": 320.817, "r_y3": 116.49800000000005, "coord_origin": "TOPLEFT"}, "text": "The Transformer Encoder consists of two 'Transformer", "orig": "The Transformer Encoder consists of two 'Transformer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 126, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 137.005, "r_x1": 545.115, "r_y1": 137.005, "r_x2": 545.115, "r_y2": 128.45299999999997, "r_x3": 308.862, "r_y3": 128.45299999999997, "coord_origin": "TOPLEFT"}, "text": "Encoder Layers', with an input feature size of 512, feed", "orig": "Encoder Layers', with an input feature size of 512, feed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 127, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 148.96000000000004, "r_x1": 545.115, "r_y1": 148.96000000000004, "r_x2": 545.115, "r_y2": 140.40800000000002, "r_x3": 308.862, "r_y3": 140.40800000000002, "coord_origin": "TOPLEFT"}, "text": "forward network of 1024, and 4 attention heads. As for the", "orig": "forward network of 1024, and 4 attention heads. As for the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 128, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 160.91499999999996, "r_x1": 545.115, "r_y1": 160.91499999999996, "r_x2": 545.115, "r_y2": 152.36300000000006, "r_x3": 308.862, "r_y3": 152.36300000000006, "coord_origin": "TOPLEFT"}, "text": "Transformer Decoder it is composed of four 'Transformer", "orig": "Transformer Decoder it is composed of four 'Transformer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 129, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 172.87, "r_x1": 545.115, "r_y1": 172.87, "r_x2": 545.115, "r_y2": 164.31799999999998, "r_x3": 308.862, "r_y3": 164.31799999999998, "coord_origin": "TOPLEFT"}, "text": "Decoder Layers' with similar input and output dimensions", "orig": "Decoder Layers' with similar input and output dimensions", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 130, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 184.82600000000002, "r_x1": 317.161, "r_y1": 184.82600000000002, "r_x2": 317.161, "r_y2": 176.274, "r_x3": 308.862, "r_y3": 176.274, "coord_origin": "TOPLEFT"}, "text": "as", "orig": "as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 131, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 321.365, "r_y0": 184.82600000000002, "r_x1": 333.539, "r_y1": 184.82600000000002, "r_x2": 333.539, "r_y2": 176.274, "r_x3": 321.365, "r_y3": 176.274, "coord_origin": "TOPLEFT"}, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 132, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 337.734, "r_y0": 184.82600000000002, "r_x1": 467.218, "r_y1": 184.82600000000002, "r_x2": 467.218, "r_y2": 176.274, "r_x3": 337.734, "r_y3": 176.274, "coord_origin": "TOPLEFT"}, "text": "'Transformer Encoder Layers'.", "orig": "'Transformer Encoder Layers'.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 133, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 475.437, "r_y0": 184.82600000000002, "r_x1": 545.115, "r_y1": 184.82600000000002, "r_x2": 545.115, "r_y2": 176.274, "r_x3": 475.437, "r_y3": 176.274, "coord_origin": "TOPLEFT"}, "text": "Even though our", "orig": "Even though our", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 134, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 196.78099999999995, "r_x1": 545.115, "r_y1": 196.78099999999995, "r_x2": 545.115, "r_y2": 188.22900000000004, "r_x3": 308.862, "r_y3": 188.22900000000004, "coord_origin": "TOPLEFT"}, "text": "model uses fewer layers and heads than the default imple-", "orig": "model uses fewer layers and heads than the default imple-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 135, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 208.736, "r_x1": 399.213, "r_y1": 208.736, "r_x2": 399.213, "r_y2": 200.18399999999997, "r_x3": 308.862, "r_y3": 200.18399999999997, "coord_origin": "TOPLEFT"}, "text": "mentation parameters,", "orig": "mentation parameters,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 136, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 403.965, "r_y0": 208.736, "r_x1": 458.63, "r_y1": 208.736, "r_x2": 458.63, "r_y2": 200.18399999999997, "r_x3": 403.965, "r_y3": 200.18399999999997, "coord_origin": "TOPLEFT"}, "text": "our extensive", "orig": "our extensive", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 137, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 462.934, "r_y0": 208.736, "r_x1": 545.115, "r_y1": 208.736, "r_x2": 545.115, "r_y2": 200.18399999999997, "r_x3": 462.934, "r_y3": 200.18399999999997, "coord_origin": "TOPLEFT"}, "text": "experimentation has", "orig": "experimentation has", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 138, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 220.69100000000003, "r_x1": 527.84, "r_y1": 220.69100000000003, "r_x2": 527.84, "r_y2": 212.139, "r_x3": 308.862, "r_y3": 212.139, "coord_origin": "TOPLEFT"}, "text": "proved this setup to be more suitable for table images.", "orig": "proved this setup to be more suitable for table images.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 139, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 532.084, "r_y0": 220.69100000000003, "r_x1": 545.115, "r_y1": 220.69100000000003, "r_x2": 545.115, "r_y2": 212.139, "r_x3": 532.084, "r_y3": 212.139, "coord_origin": "TOPLEFT"}, "text": "We", "orig": "We", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 140, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 232.64599999999996, "r_x1": 341.868, "r_y1": 232.64599999999996, "r_x2": 341.868, "r_y2": 224.09400000000005, "r_x3": 308.862, "r_y3": 224.09400000000005, "coord_origin": "TOPLEFT"}, "text": "attribute", "orig": "attribute", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 141, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 346.371, "r_y0": 232.64599999999996, "r_x1": 360.767, "r_y1": 232.64599999999996, "r_x2": 360.767, "r_y2": 224.09400000000005, "r_x3": 346.371, "r_y3": 224.09400000000005, "coord_origin": "TOPLEFT"}, "text": "this", "orig": "this", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 142, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 365.27, "r_y0": 232.64599999999996, "r_x1": 393.504, "r_y1": 232.64599999999996, "r_x2": 393.504, "r_y2": 224.09400000000005, "r_x3": 365.27, "r_y3": 224.09400000000005, "coord_origin": "TOPLEFT"}, "text": "finding", "orig": "finding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 143, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 398.007, "r_y0": 232.64599999999996, "r_x1": 405.758, "r_y1": 232.64599999999996, "r_x2": 405.758, "r_y2": 224.09400000000005, "r_x3": 398.007, "r_y3": 224.09400000000005, "coord_origin": "TOPLEFT"}, "text": "to", "orig": "to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 144, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 410.261, "r_y0": 232.64599999999996, "r_x1": 422.436, "r_y1": 232.64599999999996, "r_x2": 422.436, "r_y2": 224.09400000000005, "r_x3": 410.261, "r_y3": 224.09400000000005, "coord_origin": "TOPLEFT"}, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 145, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 426.939, "r_y0": 232.64599999999996, "r_x1": 459.586, "r_y1": 232.64599999999996, "r_x2": 459.586, "r_y2": 224.09400000000005, "r_x3": 426.939, "r_y3": 224.09400000000005, "coord_origin": "TOPLEFT"}, "text": "inherent", "orig": "inherent", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 146, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 464.089, "r_y0": 232.64599999999996, "r_x1": 490.102, "r_y1": 232.64599999999996, "r_x2": 490.102, "r_y2": 224.09400000000005, "r_x3": 464.089, "r_y3": 224.09400000000005, "coord_origin": "TOPLEFT"}, "text": "design", "orig": "design", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 147, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 494.605, "r_y0": 232.64599999999996, "r_x1": 502.904, "r_y1": 232.64599999999996, "r_x2": 502.904, "r_y2": 224.09400000000005, "r_x3": 494.605, "r_y3": 224.09400000000005, "coord_origin": "TOPLEFT"}, "text": "of", "orig": "of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 148, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 507.407, "r_y0": 232.64599999999996, "r_x1": 526.774, "r_y1": 232.64599999999996, "r_x2": 526.774, "r_y2": 224.09400000000005, "r_x3": 507.407, "r_y3": 224.09400000000005, "coord_origin": "TOPLEFT"}, "text": "table", "orig": "table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 149, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 531.277, "r_y0": 232.64599999999996, "r_x1": 545.115, "r_y1": 232.64599999999996, "r_x2": 545.115, "r_y2": 224.09400000000005, "r_x3": 531.277, "r_y3": 224.09400000000005, "coord_origin": "TOPLEFT"}, "text": "im-", "orig": "im-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 150, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 244.601, "r_x1": 545.115, "r_y1": 244.601, "r_x2": 545.115, "r_y2": 236.04899999999998, "r_x3": 308.862, "r_y3": 236.04899999999998, "coord_origin": "TOPLEFT"}, "text": "ages, which contain mostly lines and text, unlike the more", "orig": "ages, which contain mostly lines and text, unlike the more", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 151, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 256.557, "r_x1": 496.169, "r_y1": 256.557, "r_x2": 496.169, "r_y2": 248.005, "r_x3": 308.862, "r_y3": 248.005, "coord_origin": "TOPLEFT"}, "text": "elaborate content present in other scopes (e.g.", "orig": "elaborate content present in other scopes (e.g.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 152, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 501.897, "r_y0": 256.557, "r_x1": 545.115, "r_y1": 256.557, "r_x2": 545.115, "r_y2": 248.005, "r_x3": 501.897, "r_y3": 248.005, "coord_origin": "TOPLEFT"}, "text": "the COCO", "orig": "the COCO", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 153, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 268.51199999999994, "r_x1": 342.336, "r_y1": 268.51199999999994, "r_x2": 342.336, "r_y2": 259.96000000000004, "r_x3": 308.862, "r_y3": 259.96000000000004, "coord_origin": "TOPLEFT"}, "text": "dataset).", "orig": "dataset).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 154, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 348.952, "r_y0": 268.51199999999994, "r_x1": 545.115, "r_y1": 268.51199999999994, "r_x2": 545.115, "r_y2": 259.96000000000004, "r_x3": 348.952, "r_y3": 259.96000000000004, "coord_origin": "TOPLEFT"}, "text": "Moreover, we have added ResNet blocks to the", "orig": "Moreover, we have added ResNet blocks to the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 155, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 280.467, "r_x1": 545.115, "r_y1": 280.467, "r_x2": 545.115, "r_y2": 271.91499999999996, "r_x3": 308.862, "r_y3": 271.91499999999996, "coord_origin": "TOPLEFT"}, "text": "inputs of the Structure Decoder and Cell BBox Decoder.", "orig": "inputs of the Structure Decoder and Cell BBox Decoder.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 156, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 292.422, "r_x1": 545.115, "r_y1": 292.422, "r_x2": 545.115, "r_y2": 283.87, "r_x3": 308.862, "r_y3": 283.87, "coord_origin": "TOPLEFT"}, "text": "This prevents a decoder having a stronger influence over the", "orig": "This prevents a decoder having a stronger influence over the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 157, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 304.377, "r_x1": 545.115, "r_y1": 304.377, "r_x2": 545.115, "r_y2": 295.825, "r_x3": 308.862, "r_y3": 295.825, "coord_origin": "TOPLEFT"}, "text": "learned weights which would damage the other prediction", "orig": "learned weights which would damage the other prediction", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 158, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 316.332, "r_x1": 545.115, "r_y1": 316.332, "r_x2": 545.115, "r_y2": 307.78, "r_x3": 308.862, "r_y3": 307.78, "coord_origin": "TOPLEFT"}, "text": "task (structure vs bounding boxes), but learn task specific", "orig": "task (structure vs bounding boxes), but learn task specific", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 159, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 328.288, "r_x1": 532.483, "r_y1": 328.288, "r_x2": 532.483, "r_y2": 319.736, "r_x3": 308.862, "r_y3": 319.736, "coord_origin": "TOPLEFT"}, "text": "weights instead. Lastly our dropout layers are set to 0.5.", "orig": "weights instead. Lastly our dropout layers are set to 0.5.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "The Transformer Encoder consists of two 'Transformer Encoder Layers', with an input feature size of 512, feed forward network of 1024, and 4 attention heads. As for the Transformer Decoder it is composed of four 'Transformer Decoder Layers' with similar input and output dimensions as the 'Transformer Encoder Layers'. Even though our model uses fewer layers and heads than the default implementation parameters, our extensive experimentation has proved this setup to be more suitable for table images. We attribute this finding to the inherent design of table images, which contain mostly lines and text, unlike the more elaborate content present in other scopes (e.g. the COCO dataset). Moreover, we have added ResNet blocks to the inputs of the Structure Decoder and Cell BBox Decoder. This prevents a decoder having a stronger influence over the learned weights which would damage the other prediction task (structure vs bounding boxes), but learn task specific weights instead. Lastly our dropout layers are set to 0.5."}, {"label": "text", "id": 3, "page_no": 5, "cluster": {"id": 3, "label": "text", "bbox": {"l": 308.862, "t": 336.846, "r": 545.115, "b": 429.084, "coord_origin": "TOPLEFT"}, "confidence": 0.9877589344978333, "cells": [{"index": 160, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 345.398, "r_x1": 545.115, "r_y1": 345.398, "r_x2": 545.115, "r_y2": 336.846, "r_x3": 320.817, "r_y3": 336.846, "coord_origin": "TOPLEFT"}, "text": "For training, TableFormer is trained with 3 Adam opti-", "orig": "For training, TableFormer is trained with 3 Adam opti-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 161, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 357.353, "r_x1": 403.736, "r_y1": 357.353, "r_x2": 403.736, "r_y2": 348.801, "r_x3": 308.862, "r_y3": 348.801, "coord_origin": "TOPLEFT"}, "text": "mizers, each one for the", "orig": "mizers, each one for the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 162, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 406.076, "r_y0": 357.21, "r_x1": 545.112, "r_y1": 357.21, "r_x2": 545.112, "r_y2": 348.622, "r_x3": 406.076, "r_y3": 348.622, "coord_origin": "TOPLEFT"}, "text": "CNN Backbone Network Structure", "orig": "CNN Backbone Network Structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 163, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 503.539, "r_y0": 357.353, "r_x1": 506.03, "r_y1": 357.353, "r_x2": 506.03, "r_y2": 348.801, "r_x3": 503.539, "r_y3": 348.801, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 164, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 369.165, "r_x1": 343.163, "r_y1": 369.165, "r_x2": 343.163, "r_y2": 360.577, "r_x3": 308.862, "r_y3": 360.577, "coord_origin": "TOPLEFT"}, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 165, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 343.163, "r_y0": 369.308, "r_x1": 362.202, "r_y1": 369.308, "r_x2": 362.202, "r_y2": 360.756, "r_x3": 343.163, "r_y3": 360.756, "coord_origin": "TOPLEFT"}, "text": ", and", "orig": ", and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 166, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 364.286, "r_y0": 369.165, "r_x1": 440.938, "r_y1": 369.165, "r_x2": 440.938, "r_y2": 360.577, "r_x3": 364.286, "r_y3": 360.577, "coord_origin": "TOPLEFT"}, "text": "Cell BBox Decoder", "orig": "Cell BBox Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 167, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 440.939, "r_y0": 369.308, "r_x1": 443.43, "r_y1": 369.308, "r_x2": 443.43, "r_y2": 360.756, "r_x3": 440.939, "r_y3": 360.756, "coord_origin": "TOPLEFT"}, "text": ".", "orig": ".", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 168, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 446.379, "r_y0": 369.308, "r_x1": 545.108, "r_y1": 369.308, "r_x2": 545.108, "r_y2": 360.756, "r_x3": 446.379, "r_y3": 360.756, "coord_origin": "TOPLEFT"}, "text": "Taking the PubTabNet as", "orig": "Taking the PubTabNet as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 169, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 381.263, "r_x1": 545.115, "r_y1": 381.263, "r_x2": 545.115, "r_y2": 372.711, "r_x3": 308.862, "r_y3": 372.711, "coord_origin": "TOPLEFT"}, "text": "an example for our parameter set up, the initializing learn-", "orig": "an example for our parameter set up, the initializing learn-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 170, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 393.219, "r_x1": 545.115, "r_y1": 393.219, "r_x2": 545.115, "r_y2": 384.667, "r_x3": 308.862, "r_y3": 384.667, "coord_origin": "TOPLEFT"}, "text": "ing rate is 0.001 for 12 epochs with a batch size of 24, and", "orig": "ing rate is 0.001 for 12 epochs with a batch size of 24, and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 171, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 405.01, "r_x1": 314.673, "r_y1": 405.01, "r_x2": 314.673, "r_y2": 396.304, "r_x3": 308.862, "r_y3": 396.304, "coord_origin": "TOPLEFT"}, "text": "\u03bb", "orig": "\u03bb", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 172, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 318.658, "r_y0": 405.174, "r_x1": 329.726, "r_y1": 405.174, "r_x2": 329.726, "r_y2": 396.622, "r_x3": 318.658, "r_y3": 396.622, "coord_origin": "TOPLEFT"}, "text": "set", "orig": "set", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 173, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 333.711, "r_y0": 405.174, "r_x1": 341.462, "r_y1": 405.174, "r_x2": 341.462, "r_y2": 396.622, "r_x3": 333.711, "r_y3": 396.622, "coord_origin": "TOPLEFT"}, "text": "to", "orig": "to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 174, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 345.447, "r_y0": 405.174, "r_x1": 360.391, "r_y1": 405.174, "r_x2": 360.391, "r_y2": 396.622, "r_x3": 345.447, "r_y3": 396.622, "coord_origin": "TOPLEFT"}, "text": "0.5.", "orig": "0.5.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 175, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 367.963, "r_y0": 405.174, "r_x1": 415.166, "r_y1": 405.174, "r_x2": 415.166, "r_y2": 396.622, "r_x3": 367.963, "r_y3": 396.622, "coord_origin": "TOPLEFT"}, "text": "Afterwards,", "orig": "Afterwards,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 176, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 419.519, "r_y0": 405.174, "r_x1": 545.108, "r_y1": 405.174, "r_x2": 545.108, "r_y2": 396.622, "r_x3": 419.519, "r_y3": 396.622, "coord_origin": "TOPLEFT"}, "text": "we reduce the learning rate to", "orig": "we reduce the learning rate to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 177, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 417.129, "r_x1": 545.115, "r_y1": 417.129, "r_x2": 545.115, "r_y2": 408.577, "r_x3": 308.862, "r_y3": 408.577, "coord_origin": "TOPLEFT"}, "text": "0.0001, the batch size to 18 and train for 12 more epochs or", "orig": "0.0001, the batch size to 18 and train for 12 more epochs or", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 178, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 429.084, "r_x1": 360.966, "r_y1": 429.084, "r_x2": 360.966, "r_y2": 420.532, "r_x3": 308.862, "r_y3": 420.532, "coord_origin": "TOPLEFT"}, "text": "convergence.", "orig": "convergence.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "For training, TableFormer is trained with 3 Adam optimizers, each one for the CNN Backbone Network Structure , Decoder , and Cell BBox Decoder . Taking the PubTabNet as an example for our parameter set up, the initializing learning rate is 0.001 for 12 epochs with a batch size of 24, and \u03bb set to 0.5. Afterwards, we reduce the learning rate to 0.0001, the batch size to 18 and train for 12 more epochs or convergence."}, {"label": "text", "id": 0, "page_no": 5, "cluster": {"id": 0, "label": "text", "bbox": {"l": 308.862, "t": 437.643, "r": 545.115, "b": 553.7909999999999, "coord_origin": "TOPLEFT"}, "confidence": 0.9884491562843323, "cells": [{"index": 179, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 446.195, "r_x1": 545.115, "r_y1": 446.195, "r_x2": 545.115, "r_y2": 437.643, "r_x3": 320.817, "r_y3": 437.643, "coord_origin": "TOPLEFT"}, "text": "TableFormer is implemented with PyTorch and Torchvi-", "orig": "TableFormer is implemented with PyTorch and Torchvi-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 180, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 458.15, "r_x1": 384.628, "r_y1": 458.15, "r_x2": 384.628, "r_y2": 449.598, "r_x3": 308.862, "r_y3": 449.598, "coord_origin": "TOPLEFT"}, "text": "sion libraries [22].", "orig": "sion libraries [22].", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 181, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 391.372, "r_y0": 458.15, "r_x1": 545.115, "r_y1": 458.15, "r_x2": 545.115, "r_y2": 449.598, "r_x3": 391.372, "r_y3": 449.598, "coord_origin": "TOPLEFT"}, "text": "To speed up the inference, the image", "orig": "To speed up the inference, the image", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 182, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 470.105, "r_x1": 494.007, "r_y1": 470.105, "r_x2": 494.007, "r_y2": 461.553, "r_x3": 308.862, "r_y3": 461.553, "coord_origin": "TOPLEFT"}, "text": "undergoes a single forward pass through the", "orig": "undergoes a single forward pass through the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 183, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 498.078, "r_y0": 469.962, "r_x1": 545.111, "r_y1": 469.962, "r_x2": 545.111, "r_y2": 461.374, "r_x3": 498.078, "r_y3": 461.374, "coord_origin": "TOPLEFT"}, "text": "CNN Back-", "orig": "CNN Back-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 184, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 481.917, "r_x1": 364.443, "r_y1": 481.917, "r_x2": 364.443, "r_y2": 473.329, "r_x3": 308.862, "r_y3": 473.329, "coord_origin": "TOPLEFT"}, "text": "bone Network", "orig": "bone Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 185, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 367.061, "r_y0": 482.06, "r_x1": 545.113, "r_y1": 482.06, "r_x2": 545.113, "r_y2": 473.508, "r_x3": 367.061, "r_y3": 473.508, "coord_origin": "TOPLEFT"}, "text": "and transformer encoder. This eliminates the", "orig": "and transformer encoder. This eliminates the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 186, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 494.015, "r_x1": 545.115, "r_y1": 494.015, "r_x2": 545.115, "r_y2": 485.463, "r_x3": 308.862, "r_y3": 485.463, "coord_origin": "TOPLEFT"}, "text": "overhead of generating the same features for each decoding", "orig": "overhead of generating the same features for each decoding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 187, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 505.97, "r_x1": 545.115, "r_y1": 505.97, "r_x2": 545.115, "r_y2": 497.418, "r_x3": 308.862, "r_y3": 497.418, "coord_origin": "TOPLEFT"}, "text": "step. Similarly, we employ a 'caching' technique to preform", "orig": "step. Similarly, we employ a 'caching' technique to preform", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 188, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 517.9259999999999, "r_x1": 432.588, "r_y1": 517.9259999999999, "r_x2": 432.588, "r_y2": 509.374, "r_x3": 308.862, "r_y3": 509.374, "coord_origin": "TOPLEFT"}, "text": "faster autoregressive decoding.", "orig": "faster autoregressive decoding.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 189, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 436.732, "r_y0": 517.9259999999999, "r_x1": 545.115, "r_y1": 517.9259999999999, "r_x2": 545.115, "r_y2": 509.374, "r_x3": 436.732, "r_y3": 509.374, "coord_origin": "TOPLEFT"}, "text": "This is achieved by storing", "orig": "This is achieved by storing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 190, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 529.881, "r_x1": 545.115, "r_y1": 529.881, "r_x2": 545.115, "r_y2": 521.329, "r_x3": 308.862, "r_y3": 521.329, "coord_origin": "TOPLEFT"}, "text": "the features of decoded tokens so we can reuse them for", "orig": "the features of decoded tokens so we can reuse them for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 191, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 541.836, "r_x1": 370.062, "r_y1": 541.836, "r_x2": 370.062, "r_y2": 533.284, "r_x3": 308.862, "r_y3": 533.284, "coord_origin": "TOPLEFT"}, "text": "each time step.", "orig": "each time step.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 192, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 375.721, "r_y0": 541.836, "r_x1": 545.115, "r_y1": 541.836, "r_x2": 545.115, "r_y2": 533.284, "r_x3": 375.721, "r_y3": 533.284, "coord_origin": "TOPLEFT"}, "text": "Therefore, we only compute the attention", "orig": "Therefore, we only compute the attention", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 193, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 553.7909999999999, "r_x1": 377.215, "r_y1": 553.7909999999999, "r_x2": 377.215, "r_y2": 545.239, "r_x3": 308.862, "r_y3": 545.239, "coord_origin": "TOPLEFT"}, "text": "for each new tag.", "orig": "for each new tag.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "TableFormer is implemented with PyTorch and Torchvision libraries [22]. To speed up the inference, the image undergoes a single forward pass through the CNN Backbone Network and transformer encoder. This eliminates the overhead of generating the same features for each decoding step. Similarly, we employ a 'caching' technique to preform faster autoregressive decoding. This is achieved by storing the features of decoded tokens so we can reuse them for each time step. Therefore, we only compute the attention for each new tag."}, {"label": "section_header", "id": 14, "page_no": 5, "cluster": {"id": 14, "label": "section_header", "bbox": {"l": 308.862, "t": 579.554, "r": 397.443, "b": 589.406, "coord_origin": "TOPLEFT"}, "confidence": 0.9450808763504028, "cells": [{"index": 194, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 589.406, "r_x1": 397.443, "r_y1": 589.406, "r_x2": 397.443, "r_y2": 579.554, "r_x3": 308.862, "r_y3": 579.554, "coord_origin": "TOPLEFT"}, "text": "5.2. Generalization", "orig": "5.2. Generalization", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "5.2. Generalization"}, {"label": "text", "id": 2, "page_no": 5, "cluster": {"id": 2, "label": "text", "bbox": {"l": 308.862, "t": 603.718, "r": 545.115, "b": 672.046, "coord_origin": "TOPLEFT"}, "confidence": 0.9880595803260803, "cells": [{"index": 195, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 612.27, "r_x1": 545.115, "r_y1": 612.27, "r_x2": 545.115, "r_y2": 603.718, "r_x3": 320.817, "r_y3": 603.718, "coord_origin": "TOPLEFT"}, "text": "TableFormer is evaluated on three major publicly avail-", "orig": "TableFormer is evaluated on three major publicly avail-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 196, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 624.225, "r_x1": 545.115, "r_y1": 624.225, "r_x2": 545.115, "r_y2": 615.673, "r_x3": 308.862, "r_y3": 615.673, "coord_origin": "TOPLEFT"}, "text": "able datasets of different nature to prove the generalization", "orig": "able datasets of different nature to prove the generalization", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 197, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 636.1800000000001, "r_x1": 545.115, "r_y1": 636.1800000000001, "r_x2": 545.115, "r_y2": 627.6279999999999, "r_x3": 308.862, "r_y3": 627.6279999999999, "coord_origin": "TOPLEFT"}, "text": "and effectiveness of our model. The datasets used for eval-", "orig": "and effectiveness of our model. The datasets used for eval-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 198, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 648.135, "r_x1": 545.115, "r_y1": 648.135, "r_x2": 545.115, "r_y2": 639.583, "r_x3": 308.862, "r_y3": 639.583, "coord_origin": "TOPLEFT"}, "text": "uation are the PubTabNet, FinTabNet and TableBank which", "orig": "uation are the PubTabNet, FinTabNet and TableBank which", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 199, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 660.091, "r_x1": 545.115, "r_y1": 660.091, "r_x2": 545.115, "r_y2": 651.539, "r_x3": 308.862, "r_y3": 651.539, "coord_origin": "TOPLEFT"}, "text": "stem from the scientific, financial and general domains re-", "orig": "stem from the scientific, financial and general domains re-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 200, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 672.046, "r_x1": 350.705, "r_y1": 672.046, "r_x2": 350.705, "r_y2": 663.494, "r_x3": 308.862, "r_y3": 663.494, "coord_origin": "TOPLEFT"}, "text": "spectively.", "orig": "spectively.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "TableFormer is evaluated on three major publicly available datasets of different nature to prove the generalization and effectiveness of our model. The datasets used for evaluation are the PubTabNet, FinTabNet and TableBank which stem from the scientific, financial and general domains respectively."}, {"label": "text", "id": 8, "page_no": 5, "cluster": {"id": 8, "label": "text", "bbox": {"l": 308.862, "t": 680.604, "r": 545.115, "b": 713.067, "coord_origin": "TOPLEFT"}, "confidence": 0.9830910563468933, "cells": [{"index": 201, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 689.156, "r_x1": 545.115, "r_y1": 689.156, "r_x2": 545.115, "r_y2": 680.604, "r_x3": 320.817, "r_y3": 680.604, "coord_origin": "TOPLEFT"}, "text": "We also share our baseline results on the challenging", "orig": "We also share our baseline results on the challenging", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 202, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 701.111, "r_x1": 361.196, "r_y1": 701.111, "r_x2": 361.196, "r_y2": 692.559, "r_x3": 308.862, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "SynthTabNet", "orig": "SynthTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 203, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 366.057, "r_y0": 701.111, "r_x1": 396.214, "r_y1": 701.111, "r_x2": 396.214, "r_y2": 692.559, "r_x3": 366.057, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "dataset.", "orig": "dataset.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 204, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 406.406, "r_y0": 701.111, "r_x1": 453.449, "r_y1": 701.111, "r_x2": 453.449, "r_y2": 692.559, "r_x3": 406.406, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "Throughout", "orig": "Throughout", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 205, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 458.311, "r_y0": 701.111, "r_x1": 471.591, "r_y1": 701.111, "r_x2": 471.591, "r_y2": 692.559, "r_x3": 458.311, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "our", "orig": "our", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 206, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 476.453, "r_y0": 701.111, "r_x1": 527.481, "r_y1": 701.111, "r_x2": 527.481, "r_y2": 692.559, "r_x3": 476.453, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "experiments,", "orig": "experiments,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 207, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 532.941, "r_y0": 701.111, "r_x1": 545.115, "r_y1": 701.111, "r_x2": 545.115, "r_y2": 692.559, "r_x3": 532.941, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 208, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 713.067, "r_x1": 495.94, "r_y1": 713.067, "r_x2": 495.94, "r_y2": 704.515, "r_x3": 308.862, "r_y3": 704.515, "coord_origin": "TOPLEFT"}, "text": "same parameters stated in Sec. 5.1 are utilized.", "orig": "same parameters stated in Sec. 5.1 are utilized.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "We also share our baseline results on the challenging SynthTabNet dataset. Throughout our experiments, the same parameters stated in Sec. 5.1 are utilized."}, {"label": "page_footer", "id": 17, "page_no": 5, "cluster": {"id": 17, "label": "page_footer", "bbox": {"l": 295.121, "t": 734.402, "r": 300.102, "b": 742.954, "coord_origin": "TOPLEFT"}, "confidence": 0.8820409178733826, "cells": [{"index": 209, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 295.121, "r_y0": 742.954, "r_x1": 300.102, "r_y1": 742.954, "r_x2": 300.102, "r_y2": 734.402, "r_x3": 295.121, "r_y3": 734.402, "coord_origin": "TOPLEFT"}, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "6"}], "body": [{"label": "text", "id": 5, "page_no": 5, "cluster": {"id": 5, "label": "text", "bbox": {"l": 50.112, "t": 75.47699999999998, "r": 286.365, "b": 155.76, "coord_origin": "TOPLEFT"}, "confidence": 0.9868090152740479, "cells": [{"index": 0, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 84.029, "r_x1": 286.365, "r_y1": 84.029, "r_x2": 286.365, "r_y2": 75.47699999999998, "r_x3": 50.112, "r_y3": 75.47699999999998, "coord_origin": "TOPLEFT"}, "text": "tention encoding is then multiplied to the encoded image to", "orig": "tention encoding is then multiplied to the encoded image to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 95.98400000000004, "r_x1": 286.365, "r_y1": 95.98400000000004, "r_x2": 286.365, "r_y2": 87.43200000000002, "r_x3": 50.112, "r_y3": 87.43200000000002, "coord_origin": "TOPLEFT"}, "text": "produce a feature for each table cell. Notice that this is dif-", "orig": "produce a feature for each table cell. Notice that this is dif-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 107.93899999999996, "r_x1": 286.365, "r_y1": 107.93899999999996, "r_x2": 286.365, "r_y2": 99.38699999999994, "r_x3": 50.112, "r_y3": 99.38699999999994, "coord_origin": "TOPLEFT"}, "text": "ferent than the typical object detection problem where im-", "orig": "ferent than the typical object detection problem where im-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 119.894, "r_x1": 286.365, "r_y1": 119.894, "r_x2": 286.365, "r_y2": 111.34199999999998, "r_x3": 50.112, "r_y3": 111.34199999999998, "coord_origin": "TOPLEFT"}, "text": "balances between the number of detections and the amount", "orig": "balances between the number of detections and the amount", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 131.84900000000005, "r_x1": 135.691, "r_y1": 131.84900000000005, "r_x2": 135.691, "r_y2": 123.29700000000003, "r_x3": 50.112, "r_y3": 123.29700000000003, "coord_origin": "TOPLEFT"}, "text": "of objects may exist.", "orig": "of objects may exist.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 142.047, "r_y0": 131.84900000000005, "r_x1": 286.365, "r_y1": 131.84900000000005, "r_x2": 286.365, "r_y2": 123.29700000000003, "r_x3": 142.047, "r_y3": 123.29700000000003, "coord_origin": "TOPLEFT"}, "text": "In our case, we know up front that", "orig": "In our case, we know up front that", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 143.80499999999995, "r_x1": 286.365, "r_y1": 143.80499999999995, "r_x2": 286.365, "r_y2": 135.25300000000004, "r_x3": 50.112, "r_y3": 135.25300000000004, "coord_origin": "TOPLEFT"}, "text": "the produced detections always match with the table cells", "orig": "the produced detections always match with the table cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 155.76, "r_x1": 175.163, "r_y1": 155.76, "r_x2": 175.163, "r_y2": 147.20799999999997, "r_x3": 50.112, "r_y3": 147.20799999999997, "coord_origin": "TOPLEFT"}, "text": "in number and correspondence.", "orig": "in number and correspondence.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "tention encoding is then multiplied to the encoded image to produce a feature for each table cell. Notice that this is different than the typical object detection problem where imbalances between the number of detections and the amount of objects may exist. In our case, we know up front that the produced detections always match with the table cells in number and correspondence."}, {"label": "text", "id": 6, "page_no": 5, "cluster": {"id": 6, "label": "text", "bbox": {"l": 50.112, "t": 159.89300000000003, "r": 286.365, "b": 240.17700000000002, "coord_origin": "TOPLEFT"}, "confidence": 0.9860327839851379, "cells": [{"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 168.44500000000005, "r_x1": 108.154, "r_y1": 168.44500000000005, "r_x2": 108.154, "r_y2": 159.89300000000003, "r_x3": 62.067, "r_y3": 159.89300000000003, "coord_origin": "TOPLEFT"}, "text": "The output", "orig": "The output", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 113.275, "r_y0": 168.44500000000005, "r_x1": 144.806, "r_y1": 168.44500000000005, "r_x2": 144.806, "r_y2": 159.89300000000003, "r_x3": 113.275, "r_y3": 159.89300000000003, "coord_origin": "TOPLEFT"}, "text": "features", "orig": "features", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 149.937, "r_y0": 168.44500000000005, "r_x1": 161.554, "r_y1": 168.44500000000005, "r_x2": 161.554, "r_y2": 159.89300000000003, "r_x3": 149.937, "r_y3": 159.89300000000003, "coord_origin": "TOPLEFT"}, "text": "for", "orig": "for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 166.684, "r_y0": 168.44500000000005, "r_x1": 184.936, "r_y1": 168.44500000000005, "r_x2": 184.936, "r_y2": 159.89300000000003, "r_x3": 166.684, "r_y3": 159.89300000000003, "coord_origin": "TOPLEFT"}, "text": "each", "orig": "each", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 190.057, "r_y0": 168.44500000000005, "r_x1": 209.424, "r_y1": 168.44500000000005, "r_x2": 209.424, "r_y2": 159.89300000000003, "r_x3": 190.057, "r_y3": 159.89300000000003, "coord_origin": "TOPLEFT"}, "text": "table", "orig": "table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 214.555, "r_y0": 168.44500000000005, "r_x1": 228.941, "r_y1": 168.44500000000005, "r_x2": 228.941, "r_y2": 159.89300000000003, "r_x3": 214.555, "r_y3": 159.89300000000003, "coord_origin": "TOPLEFT"}, "text": "cell", "orig": "cell", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 234.061, "r_y0": 168.44500000000005, "r_x1": 246.226, "r_y1": 168.44500000000005, "r_x2": 246.226, "r_y2": 159.89300000000003, "r_x3": 234.061, "r_y3": 159.89300000000003, "coord_origin": "TOPLEFT"}, "text": "are", "orig": "are", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 251.356, "r_y0": 168.44500000000005, "r_x1": 268.512, "r_y1": 168.44500000000005, "r_x2": 268.512, "r_y2": 159.89300000000003, "r_x3": 251.356, "r_y3": 159.89300000000003, "coord_origin": "TOPLEFT"}, "text": "then", "orig": "then", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 273.643, "r_y0": 168.44500000000005, "r_x1": 286.365, "r_y1": 168.44500000000005, "r_x2": 286.365, "r_y2": 159.89300000000003, "r_x3": 273.643, "r_y3": 159.89300000000003, "coord_origin": "TOPLEFT"}, "text": "fed", "orig": "fed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 180.40099999999995, "r_x1": 65.614, "r_y1": 180.40099999999995, "r_x2": 65.614, "r_y2": 171.84900000000005, "r_x3": 50.112, "r_y3": 171.84900000000005, "coord_origin": "TOPLEFT"}, "text": "into", "orig": "into", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.107, "r_y0": 180.40099999999995, "r_x1": 82.281, "r_y1": 180.40099999999995, "r_x2": 82.281, "r_y2": 171.84900000000005, "r_x3": 70.107, "r_y3": 171.84900000000005, "coord_origin": "TOPLEFT"}, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 19, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 86.764, "r_y0": 180.40099999999995, "r_x1": 138.66, "r_y1": 180.40099999999995, "r_x2": 138.66, "r_y2": 171.84900000000005, "r_x3": 86.764, "r_y3": 171.84900000000005, "coord_origin": "TOPLEFT"}, "text": "feed-forward", "orig": "feed-forward", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 20, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 143.153, "r_y0": 180.40099999999995, "r_x1": 286.365, "r_y1": 180.40099999999995, "r_x2": 286.365, "r_y2": 171.84900000000005, "r_x3": 143.153, "r_y3": 171.84900000000005, "coord_origin": "TOPLEFT"}, "text": "network (FFN). The FFN consists", "orig": "network (FFN). The FFN consists", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 21, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 192.356, "r_x1": 286.365, "r_y1": 192.356, "r_x2": 286.365, "r_y2": 183.80399999999997, "r_x3": 50.112, "r_y3": 183.80399999999997, "coord_origin": "TOPLEFT"}, "text": "of a Multi-Layer Perceptron (3 layers with ReLU activa-", "orig": "of a Multi-Layer Perceptron (3 layers with ReLU activa-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 22, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 204.31100000000004, "r_x1": 286.365, "r_y1": 204.31100000000004, "r_x2": 286.365, "r_y2": 195.75900000000001, "r_x3": 50.112, "r_y3": 195.75900000000001, "coord_origin": "TOPLEFT"}, "text": "tion function) that predicts the normalized coordinates for", "orig": "tion function) that predicts the normalized coordinates for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 23, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 216.26599999999996, "r_x1": 196.004, "r_y1": 216.26599999999996, "r_x2": 196.004, "r_y2": 207.71400000000006, "r_x3": 50.112, "r_y3": 207.71400000000006, "coord_origin": "TOPLEFT"}, "text": "the bounding box of each table cell.", "orig": "the bounding box of each table cell.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 24, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 200.786, "r_y0": 216.26599999999996, "r_x1": 286.365, "r_y1": 216.26599999999996, "r_x2": 286.365, "r_y2": 207.71400000000006, "r_x3": 200.786, "r_y3": 207.71400000000006, "coord_origin": "TOPLEFT"}, "text": "Finally, the predicted", "orig": "Finally, the predicted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 25, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 228.221, "r_x1": 286.365, "r_y1": 228.221, "r_x2": 286.365, "r_y2": 219.66899999999998, "r_x3": 50.112, "r_y3": 219.66899999999998, "coord_origin": "TOPLEFT"}, "text": "bounding boxes are classified based on whether they are", "orig": "bounding boxes are classified based on whether they are", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 26, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 240.17700000000002, "r_x1": 181.549, "r_y1": 240.17700000000002, "r_x2": 181.549, "r_y2": 231.625, "r_x3": 50.112, "r_y3": 231.625, "coord_origin": "TOPLEFT"}, "text": "empty or not using a linear layer.", "orig": "empty or not using a linear layer.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "The output features for each table cell are then fed into the feed-forward network (FFN). The FFN consists of a Multi-Layer Perceptron (3 layers with ReLU activation function) that predicts the normalized coordinates for the bounding box of each table cell. Finally, the predicted bounding boxes are classified based on whether they are empty or not using a linear layer."}, {"label": "text", "id": 4, "page_no": 5, "cluster": {"id": 4, "label": "text", "bbox": {"l": 50.112, "t": 243.92200000000003, "r": 286.366, "b": 444.145, "coord_origin": "TOPLEFT"}, "confidence": 0.9873637557029724, "cells": [{"index": 27, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 252.87800000000004, "r_x1": 129.215, "r_y1": 252.87800000000004, "r_x2": 129.215, "r_y2": 243.92200000000003, "r_x3": 62.067, "r_y3": 243.92200000000003, "coord_origin": "TOPLEFT"}, "text": "Loss Functions.", "orig": "Loss Functions.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 28, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.451, "r_y0": 252.86199999999997, "r_x1": 276.139, "r_y1": 252.86199999999997, "r_x2": 276.139, "r_y2": 244.30999999999995, "r_x3": 134.451, "r_y3": 244.30999999999995, "coord_origin": "TOPLEFT"}, "text": "We formulate a multi-task loss Eq.", "orig": "We formulate a multi-task loss Eq.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 29, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 281.379, "r_y0": 252.86199999999997, "r_x1": 286.361, "r_y1": 252.86199999999997, "r_x2": 286.361, "r_y2": 244.30999999999995, "r_x3": 281.379, "r_y3": 244.30999999999995, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 30, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 264.817, "r_x1": 134.685, "r_y1": 264.817, "r_x2": 134.685, "r_y2": 256.265, "r_x3": 50.112, "r_y3": 256.265, "coord_origin": "TOPLEFT"}, "text": "to train our network.", "orig": "to train our network.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 140.543, "r_y0": 264.817, "r_x1": 286.365, "r_y1": 264.817, "r_x2": 286.365, "r_y2": 256.265, "r_x3": 140.543, "r_y3": 256.265, "coord_origin": "TOPLEFT"}, "text": "The Cross-Entropy loss (denoted as", "orig": "The Cross-Entropy loss (denoted as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 276.60900000000004, "r_x1": 53.085, "r_y1": 276.60900000000004, "r_x2": 53.085, "r_y2": 267.903, "r_x3": 50.112, "r_y3": 267.903, "coord_origin": "TOPLEFT"}, "text": "l", "orig": "l", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 53.085, "r_y0": 277.53200000000004, "r_x1": 56.845, "r_y1": 277.53200000000004, "r_x2": 56.845, "r_y2": 271.438, "r_x3": 53.085, "r_y3": 271.438, "coord_origin": "TOPLEFT"}, "text": "s", "orig": "s", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 57.343, "r_y0": 276.773, "r_x1": 135.4, "r_y1": 276.773, "r_x2": 135.4, "r_y2": 268.221, "r_x3": 57.343, "r_y3": 268.221, "coord_origin": "TOPLEFT"}, "text": ") is used to train the", "orig": ") is used to train the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 137.735, "r_y0": 276.63, "r_x1": 211.08, "r_y1": 276.63, "r_x2": 211.08, "r_y2": 268.04200000000003, "r_x3": 137.735, "r_y3": 268.04200000000003, "coord_origin": "TOPLEFT"}, "text": "Structure Decoder", "orig": "Structure Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 213.637, "r_y0": 276.773, "r_x1": 286.364, "r_y1": 276.773, "r_x2": 286.364, "r_y2": 268.221, "r_x3": 213.637, "r_y3": 268.221, "coord_origin": "TOPLEFT"}, "text": "which predicts the", "orig": "which predicts the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 288.728, "r_x1": 158.824, "r_y1": 288.728, "r_x2": 158.824, "r_y2": 280.176, "r_x3": 50.112, "r_y3": 280.176, "coord_origin": "TOPLEFT"}, "text": "structure tokens. As for the", "orig": "structure tokens. As for the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 161.318, "r_y0": 288.585, "r_x1": 238.797, "r_y1": 288.585, "r_x2": 238.797, "r_y2": 279.99699999999996, "r_x3": 161.318, "r_y3": 279.99699999999996, "coord_origin": "TOPLEFT"}, "text": "Cell BBox Decoder", "orig": "Cell BBox Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 241.521, "r_y0": 288.728, "r_x1": 286.363, "r_y1": 288.728, "r_x2": 286.363, "r_y2": 280.176, "r_x3": 241.521, "r_y3": 280.176, "coord_origin": "TOPLEFT"}, "text": "it is trained", "orig": "it is trained", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 300.683, "r_x1": 211.377, "r_y1": 300.683, "r_x2": 211.377, "r_y2": 292.131, "r_x3": 50.112, "r_y3": 292.131, "coord_origin": "TOPLEFT"}, "text": "with a combination of losses denoted as", "orig": "with a combination of losses denoted as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 214.271, "r_y0": 300.519, "r_x1": 217.244, "r_y1": 300.519, "r_x2": 217.244, "r_y2": 291.813, "r_x3": 214.271, "r_y3": 291.813, "coord_origin": "TOPLEFT"}, "text": "l", "orig": "l", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 217.244, "r_y0": 301.442, "r_x1": 229.198, "r_y1": 301.442, "r_x2": 229.198, "r_y2": 295.348, "r_x3": 217.244, "r_y3": 295.348, "coord_origin": "TOPLEFT"}, "text": "box", "orig": "box", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 229.696, "r_y0": 300.683, "r_x1": 232.187, "r_y1": 300.683, "r_x2": 232.187, "r_y2": 292.131, "r_x3": 229.696, "r_y3": 292.131, "coord_origin": "TOPLEFT"}, "text": ".", "orig": ".", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 236.49, "r_y0": 300.519, "r_x1": 239.463, "r_y1": 300.519, "r_x2": 239.463, "r_y2": 291.813, "r_x3": 236.49, "r_y3": 291.813, "coord_origin": "TOPLEFT"}, "text": "l", "orig": "l", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 239.463, "r_y0": 301.442, "r_x1": 251.417, "r_y1": 301.442, "r_x2": 251.417, "r_y2": 295.348, "r_x3": 239.463, "r_y3": 295.348, "coord_origin": "TOPLEFT"}, "text": "box", "orig": "box", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 254.811, "r_y0": 300.683, "r_x1": 286.363, "r_y1": 300.683, "r_x2": 286.363, "r_y2": 292.131, "r_x3": 254.811, "r_y3": 292.131, "coord_origin": "TOPLEFT"}, "text": "consists", "orig": "consists", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 312.638, "r_x1": 137.454, "r_y1": 312.638, "r_x2": 137.454, "r_y2": 304.086, "r_x3": 50.112, "r_y3": 304.086, "coord_origin": "TOPLEFT"}, "text": "of the generally used", "orig": "of the generally used", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 48, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 141.298, "r_y0": 312.474, "r_x1": 144.271, "r_y1": 312.474, "r_x2": 144.271, "r_y2": 303.768, "r_x3": 141.298, "r_y3": 303.768, "coord_origin": "TOPLEFT"}, "text": "l", "orig": "l", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 49, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 144.271, "r_y0": 313.398, "r_x1": 148.243, "r_y1": 313.398, "r_x2": 148.243, "r_y2": 307.304, "r_x3": 144.271, "r_y3": 307.304, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 50, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 152.586, "r_y0": 312.638, "r_x1": 286.364, "r_y1": 312.638, "r_x2": 286.364, "r_y2": 304.086, "r_x3": 152.586, "r_y3": 304.086, "coord_origin": "TOPLEFT"}, "text": "loss for object detection and the", "orig": "loss for object detection and the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 51, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 324.593, "r_x1": 89.683, "r_y1": 324.593, "r_x2": 89.683, "r_y2": 316.041, "r_x3": 50.112, "r_y3": 316.041, "coord_origin": "TOPLEFT"}, "text": "IoU loss (", "orig": "IoU loss (", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 52, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 89.686, "r_y0": 324.429, "r_x1": 92.659, "r_y1": 324.429, "r_x2": 92.659, "r_y2": 315.723, "r_x3": 89.686, "r_y3": 315.723, "coord_origin": "TOPLEFT"}, "text": "l", "orig": "l", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 53, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 92.659, "r_y0": 325.353, "r_x1": 104.12, "r_y1": 325.353, "r_x2": 104.12, "r_y2": 319.259, "r_x3": 92.659, "r_y3": 319.259, "coord_origin": "TOPLEFT"}, "text": "iou", "orig": "iou", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 54, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 104.618, "r_y0": 324.593, "r_x1": 286.366, "r_y1": 324.593, "r_x2": 286.366, "r_y2": 316.041, "r_x3": 104.618, "r_y3": 316.041, "coord_origin": "TOPLEFT"}, "text": ") to be scale invariant as explained in [25]. In", "orig": ") to be scale invariant as explained in [25]. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 55, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 336.549, "r_x1": 286.365, "r_y1": 336.549, "r_x2": 286.365, "r_y2": 327.997, "r_x3": 50.112, "r_y3": 327.997, "coord_origin": "TOPLEFT"}, "text": "comparison to DETR, we do not use the Hungarian algo-", "orig": "comparison to DETR, we do not use the Hungarian algo-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 56, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 348.504, "r_x1": 286.365, "r_y1": 348.504, "r_x2": 286.365, "r_y2": 339.952, "r_x3": 50.112, "r_y3": 339.952, "coord_origin": "TOPLEFT"}, "text": "rithm [15] to match the predicted bounding boxes with the", "orig": "rithm [15] to match the predicted bounding boxes with the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 57, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 360.459, "r_x1": 286.365, "r_y1": 360.459, "r_x2": 286.365, "r_y2": 351.907, "r_x3": 50.112, "r_y3": 351.907, "coord_origin": "TOPLEFT"}, "text": "ground-truth boxes, as we have already achieved a one-to-", "orig": "ground-truth boxes, as we have already achieved a one-to-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 58, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 372.414, "r_x1": 286.365, "r_y1": 372.414, "r_x2": 286.365, "r_y2": 363.862, "r_x3": 50.112, "r_y3": 363.862, "coord_origin": "TOPLEFT"}, "text": "one match through two steps: 1) Our token input sequence", "orig": "one match through two steps: 1) Our token input sequence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 59, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 384.369, "r_x1": 286.365, "r_y1": 384.369, "r_x2": 286.365, "r_y2": 375.817, "r_x3": 50.112, "r_y3": 375.817, "coord_origin": "TOPLEFT"}, "text": "is naturally ordered, therefore the hidden states of the table", "orig": "is naturally ordered, therefore the hidden states of the table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 60, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 396.324, "r_x1": 286.365, "r_y1": 396.324, "r_x2": 286.365, "r_y2": 387.772, "r_x3": 50.112, "r_y3": 387.772, "coord_origin": "TOPLEFT"}, "text": "data cells are also in order when they are provided as in-", "orig": "data cells are also in order when they are provided as in-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 61, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 408.28, "r_x1": 88.687, "r_y1": 408.28, "r_x2": 88.687, "r_y2": 399.728, "r_x3": 50.112, "r_y3": 399.728, "coord_origin": "TOPLEFT"}, "text": "put to the", "orig": "put to the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 62, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 91.646, "r_y0": 408.137, "r_x1": 170.052, "r_y1": 408.137, "r_x2": 170.052, "r_y2": 399.549, "r_x3": 91.646, "r_y3": 399.549, "coord_origin": "TOPLEFT"}, "text": "Cell BBox Decoder", "orig": "Cell BBox Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 63, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 170.051, "r_y0": 408.28, "r_x1": 172.542, "r_y1": 408.28, "r_x2": 172.542, "r_y2": 399.728, "r_x3": 170.051, "r_y3": 399.728, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 64, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 175.62, "r_y0": 408.28, "r_x1": 286.364, "r_y1": 408.28, "r_x2": 286.364, "r_y2": 399.728, "r_x3": 175.62, "r_y3": 399.728, "coord_origin": "TOPLEFT"}, "text": "and 2) Our bounding boxes", "orig": "and 2) Our bounding boxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 65, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 420.235, "r_x1": 181.967, "r_y1": 420.235, "r_x2": 181.967, "r_y2": 411.683, "r_x3": 50.112, "r_y3": 411.683, "coord_origin": "TOPLEFT"}, "text": "generation mechanism (see Sec.", "orig": "generation mechanism (see Sec.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 66, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 189.09, "r_y0": 420.235, "r_x1": 286.365, "r_y1": 420.235, "r_x2": 286.365, "r_y2": 411.683, "r_x3": 189.09, "r_y3": 411.683, "coord_origin": "TOPLEFT"}, "text": "3) ensures a one-to-one", "orig": "3) ensures a one-to-one", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 67, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 432.19, "r_x1": 286.365, "r_y1": 432.19, "r_x2": 286.365, "r_y2": 423.638, "r_x3": 50.112, "r_y3": 423.638, "coord_origin": "TOPLEFT"}, "text": "mapping between the cell content and its bounding box for", "orig": "mapping between the cell content and its bounding box for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 68, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 444.145, "r_x1": 158.296, "r_y1": 444.145, "r_x2": 158.296, "r_y2": 435.593, "r_x3": 50.112, "r_y3": 435.593, "coord_origin": "TOPLEFT"}, "text": "all post-processed datasets.", "orig": "all post-processed datasets.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Loss Functions. We formulate a multi-task loss Eq. 2 to train our network. The Cross-Entropy loss (denoted as l s ) is used to train the Structure Decoder which predicts the structure tokens. As for the Cell BBox Decoder it is trained with a combination of losses denoted as l box . l box consists of the generally used l 1 loss for object detection and the IoU loss ( l iou ) to be scale invariant as explained in [25]. In comparison to DETR, we do not use the Hungarian algorithm [15] to match the predicted bounding boxes with the ground-truth boxes, as we have already achieved a one-toone match through two steps: 1) Our token input sequence is naturally ordered, therefore the hidden states of the table data cells are also in order when they are provided as input to the Cell BBox Decoder , and 2) Our bounding boxes generation mechanism (see Sec. 3) ensures a one-to-one mapping between the cell content and its bounding box for all post-processed datasets."}, {"label": "text", "id": 11, "page_no": 5, "cluster": {"id": 11, "label": "text", "bbox": {"l": 50.112, "t": 448.279, "r": 286.365, "b": 468.786, "coord_origin": "TOPLEFT"}, "confidence": 0.9724196195602417, "cells": [{"index": 69, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 456.831, "r_x1": 286.365, "r_y1": 456.831, "r_x2": 286.365, "r_y2": 448.279, "r_x3": 62.067, "r_y3": 448.279, "coord_origin": "TOPLEFT"}, "text": "The loss used to train the TableFormer can be defined as", "orig": "The loss used to train the TableFormer can be defined as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 70, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 468.786, "r_x1": 91.377, "r_y1": 468.786, "r_x2": 91.377, "r_y2": 460.234, "r_x3": 50.112, "r_y3": 460.234, "coord_origin": "TOPLEFT"}, "text": "following:", "orig": "following:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "The loss used to train the TableFormer can be defined as following:"}, {"label": "formula", "id": 15, "page_no": 5, "cluster": {"id": 15, "label": "formula", "bbox": {"l": 124.33, "t": 493.391, "r": 286.362, "b": 517.9639999999999, "coord_origin": "TOPLEFT"}, "confidence": 0.9423348307609558, "cells": [{"index": 71, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 125.715, "r_y0": 502.097, "r_x1": 128.688, "r_y1": 502.097, "r_x2": 128.688, "r_y2": 493.391, "r_x3": 125.715, "r_y3": 493.391, "coord_origin": "TOPLEFT"}, "text": "l", "orig": "l", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 72, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 128.688, "r_y0": 503.02, "r_x1": 140.642, "r_y1": 503.02, "r_x2": 140.642, "r_y2": 496.926, "r_x3": 128.688, "r_y3": 496.926, "coord_origin": "TOPLEFT"}, "text": "box", "orig": "box", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 73, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 143.907, "r_y0": 502.097, "r_x1": 151.656, "r_y1": 502.097, "r_x2": 151.656, "r_y2": 493.391, "r_x3": 143.907, "r_y3": 493.391, "coord_origin": "TOPLEFT"}, "text": "=", "orig": "=", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 74, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 154.423, "r_y0": 502.097, "r_x1": 160.234, "r_y1": 502.097, "r_x2": 160.234, "r_y2": 493.391, "r_x3": 154.423, "r_y3": 493.391, "coord_origin": "TOPLEFT"}, "text": "\u03bb", "orig": "\u03bb", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 75, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.235, "r_y0": 503.02, "r_x1": 186.628, "r_y1": 503.02, "r_x2": 186.628, "r_y2": 496.926, "r_x3": 160.235, "r_y3": 496.926, "coord_origin": "TOPLEFT"}, "text": "iou iou", "orig": "iou iou", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 76, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 172.194, "r_y0": 502.097, "r_x1": 175.167, "r_y1": 502.097, "r_x2": 175.167, "r_y2": 493.391, "r_x3": 172.194, "r_y3": 493.391, "coord_origin": "TOPLEFT"}, "text": "l", "orig": "l", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 77, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 189.34, "r_y0": 502.097, "r_x1": 197.089, "r_y1": 502.097, "r_x2": 197.089, "r_y2": 493.391, "r_x3": 189.34, "r_y3": 493.391, "coord_origin": "TOPLEFT"}, "text": "+", "orig": "+", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 78, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 199.303, "r_y0": 502.097, "r_x1": 205.114, "r_y1": 502.097, "r_x2": 205.114, "r_y2": 493.391, "r_x3": 199.303, "r_y3": 493.391, "coord_origin": "TOPLEFT"}, "text": "\u03bb", "orig": "\u03bb", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 79, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 205.115, "r_y0": 503.02, "r_x1": 207.635, "r_y1": 503.02, "r_x2": 207.635, "r_y2": 496.926, "r_x3": 205.115, "r_y3": 496.926, "coord_origin": "TOPLEFT"}, "text": "l", "orig": "l", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 80, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 207.675, "r_y0": 503.02, "r_x1": 211.647, "r_y1": 503.02, "r_x2": 211.647, "r_y2": 496.926, "r_x3": 207.675, "r_y3": 496.926, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 81, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 124.33, "r_y0": 517.0409999999999, "r_x1": 127.303, "r_y1": 517.0409999999999, "r_x2": 127.303, "r_y2": 508.335, "r_x3": 124.33, "r_y3": 508.335, "coord_origin": "TOPLEFT"}, "text": "l", "orig": "l", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 82, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 130.266, "r_y0": 517.0409999999999, "r_x1": 138.015, "r_y1": 517.0409999999999, "r_x2": 138.015, "r_y2": 508.335, "r_x3": 130.266, "r_y3": 508.335, "coord_origin": "TOPLEFT"}, "text": "=", "orig": "=", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 83, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 140.782, "r_y0": 517.0409999999999, "r_x1": 149.566, "r_y1": 517.0409999999999, "r_x2": 149.566, "r_y2": 508.335, "r_x3": 140.782, "r_y3": 508.335, "coord_origin": "TOPLEFT"}, "text": "\u03bbl", "orig": "\u03bbl", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 84, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 149.566, "r_y0": 517.9639999999999, "r_x1": 153.326, "r_y1": 517.9639999999999, "r_x2": 153.326, "r_y2": 511.87, "r_x3": 149.566, "r_y3": 511.87, "coord_origin": "TOPLEFT"}, "text": "s", "orig": "s", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 85, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 156.039, "r_y0": 517.0409999999999, "r_x1": 174.855, "r_y1": 517.0409999999999, "r_x2": 174.855, "r_y2": 508.335, "r_x3": 156.039, "r_y3": 508.335, "coord_origin": "TOPLEFT"}, "text": "+(1", "orig": "+(1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 86, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 177.071, "r_y0": 516.899, "r_x1": 184.82, "r_y1": 516.899, "r_x2": 184.82, "r_y2": 508.335, "r_x3": 177.071, "r_y3": 508.335, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 87, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 187.033, "r_y0": 517.0409999999999, "r_x1": 199.692, "r_y1": 517.0409999999999, "r_x2": 199.692, "r_y2": 508.335, "r_x3": 187.033, "r_y3": 508.335, "coord_origin": "TOPLEFT"}, "text": "\u03bb l", "orig": "\u03bb l", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 88, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 192.845, "r_y0": 517.0409999999999, "r_x1": 196.719, "r_y1": 517.0409999999999, "r_x2": 196.719, "r_y2": 508.335, "r_x3": 192.845, "r_y3": 508.335, "coord_origin": "TOPLEFT"}, "text": ")", "orig": ")", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 89, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 199.692, "r_y0": 517.9639999999999, "r_x1": 211.646, "r_y1": 517.9639999999999, "r_x2": 211.646, "r_y2": 511.87, "r_x3": 199.692, "r_y3": 511.87, "coord_origin": "TOPLEFT"}, "text": "box", "orig": "box", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 90, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 274.746, "r_y0": 509.832, "r_x1": 286.362, "r_y1": 509.832, "r_x2": 286.362, "r_y2": 501.28, "r_x3": 274.746, "r_y3": 501.28, "coord_origin": "TOPLEFT"}, "text": "(1)", "orig": "(1)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "l box = \u03bb iou iou l + \u03bb l 1 l = \u03bbl s +(1 -\u03bb l ) box (1)"}, {"label": "text", "id": 16, "page_no": 5, "cluster": {"id": 16, "label": "text", "bbox": {"l": 50.112, "t": 531.26, "r": 281.597, "b": 540.889, "coord_origin": "TOPLEFT"}, "confidence": 0.9363929629325867, "cells": [{"index": 91, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 540.13, "r_x1": 74.451, "r_y1": 540.13, "r_x2": 74.451, "r_y2": 531.578, "r_x3": 50.112, "r_y3": 531.578, "coord_origin": "TOPLEFT"}, "text": "where", "orig": "where", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 92, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 76.941, "r_y0": 539.966, "r_x1": 82.752, "r_y1": 539.966, "r_x2": 82.752, "r_y2": 531.26, "r_x3": 76.941, "r_y3": 531.26, "coord_origin": "TOPLEFT"}, "text": "\u03bb", "orig": "\u03bb", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 93, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 85.52, "r_y0": 539.8240000000001, "r_x1": 92.162, "r_y1": 539.8240000000001, "r_x2": 92.162, "r_y2": 531.26, "r_x3": 85.52, "r_y3": 531.26, "coord_origin": "TOPLEFT"}, "text": "\u2208", "orig": "\u2208", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 94, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 94.653, "r_y0": 540.13, "r_x1": 135.599, "r_y1": 540.13, "r_x2": 135.599, "r_y2": 531.578, "r_x3": 94.653, "r_y3": 531.578, "coord_origin": "TOPLEFT"}, "text": "[0, 1], and", "orig": "[0, 1], and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 95, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 138.09, "r_y0": 539.966, "r_x1": 143.901, "r_y1": 539.966, "r_x2": 143.901, "r_y2": 531.26, "r_x3": 138.09, "r_y3": 531.26, "coord_origin": "TOPLEFT"}, "text": "\u03bb", "orig": "\u03bb", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 96, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 143.901, "r_y0": 540.889, "r_x1": 155.362, "r_y1": 540.889, "r_x2": 155.362, "r_y2": 534.7950000000001, "r_x3": 143.901, "r_y3": 534.7950000000001, "coord_origin": "TOPLEFT"}, "text": "iou", "orig": "iou", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 97, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 155.861, "r_y0": 539.966, "r_x1": 166.104, "r_y1": 539.966, "r_x2": 166.104, "r_y2": 531.26, "r_x3": 155.861, "r_y3": 531.26, "coord_origin": "TOPLEFT"}, "text": ", \u03bb", "orig": ", \u03bb", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 98, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 166.1, "r_y0": 540.889, "r_x1": 168.62, "r_y1": 540.889, "r_x2": 168.62, "r_y2": 534.7950000000001, "r_x3": 166.1, "r_y3": 534.7950000000001, "coord_origin": "TOPLEFT"}, "text": "l", "orig": "l", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 99, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 168.66, "r_y0": 540.889, "r_x1": 172.632, "r_y1": 540.889, "r_x2": 172.632, "r_y2": 534.7950000000001, "r_x3": 168.66, "r_y3": 534.7950000000001, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 100, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 175.897, "r_y0": 539.8240000000001, "r_x1": 182.539, "r_y1": 539.8240000000001, "r_x2": 182.539, "r_y2": 531.26, "r_x3": 175.897, "r_y3": 531.26, "coord_origin": "TOPLEFT"}, "text": "\u2208", "orig": "\u2208", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 101, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 185.306, "r_y0": 538.064, "r_x1": 192.501, "r_y1": 538.064, "r_x2": 192.501, "r_y2": 533.441, "r_x3": 185.306, "r_y3": 533.441, "coord_origin": "TOPLEFT"}, "text": "R", "orig": "R", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 102, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 194.992, "r_y0": 540.13, "r_x1": 281.597, "r_y1": 540.13, "r_x2": 281.597, "r_y2": 531.578, "r_x3": 194.992, "r_y3": 531.578, "coord_origin": "TOPLEFT"}, "text": "are hyper-parameters.", "orig": "are hyper-parameters.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "where \u03bb \u2208 [0, 1], and \u03bb iou , \u03bb l 1 \u2208 R are hyper-parameters."}, {"label": "section_header", "id": 12, "page_no": 5, "cluster": {"id": 12, "label": "section_header", "bbox": {"l": 50.112, "t": 555.917, "r": 171.983, "b": 566.665, "coord_origin": "TOPLEFT"}, "confidence": 0.9554555416107178, "cells": [{"index": 103, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 566.665, "r_x1": 171.983, "r_y1": 566.665, "r_x2": 171.983, "r_y2": 555.917, "r_x3": 50.112, "r_y3": 555.917, "coord_origin": "TOPLEFT"}, "text": "5. Experimental Results", "orig": "5. Experimental Results", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "5. Experimental Results"}, {"label": "section_header", "id": 13, "page_no": 5, "cluster": {"id": 13, "label": "section_header", "bbox": {"l": 50.112, "t": 576.264, "r": 179.175, "b": 586.116, "coord_origin": "TOPLEFT"}, "confidence": 0.9538503289222717, "cells": [{"index": 104, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 586.116, "r_x1": 179.175, "r_y1": 586.116, "r_x2": 179.175, "r_y2": 576.264, "r_x3": 50.112, "r_y3": 576.264, "coord_origin": "TOPLEFT"}, "text": "5.1. Implementation Details", "orig": "5.1. Implementation Details", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "5.1. Implementation Details"}, {"label": "text", "id": 7, "page_no": 5, "cluster": {"id": 7, "label": "text", "bbox": {"l": 50.112, "t": 595.8240000000001, "r": 286.365, "b": 640.421, "coord_origin": "TOPLEFT"}, "confidence": 0.9856163263320923, "cells": [{"index": 105, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 604.5550000000001, "r_x1": 202.978, "r_y1": 604.5550000000001, "r_x2": 202.978, "r_y2": 596.0029999999999, "r_x3": 62.067, "r_y3": 596.0029999999999, "coord_origin": "TOPLEFT"}, "text": "TableFormer uses ResNet-18 as the", "orig": "TableFormer uses ResNet-18 as the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 106, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 205.384, "r_y0": 604.412, "r_x1": 286.36, "r_y1": 604.412, "r_x2": 286.36, "r_y2": 595.8240000000001, "r_x3": 205.384, "r_y3": 595.8240000000001, "coord_origin": "TOPLEFT"}, "text": "CNN Backbone Net-", "orig": "CNN Backbone Net-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 107, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 616.367, "r_x1": 70.037, "r_y1": 616.367, "r_x2": 70.037, "r_y2": 607.779, "r_x3": 50.112, "r_y3": 607.779, "coord_origin": "TOPLEFT"}, "text": "work", "orig": "work", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 108, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.037, "r_y0": 616.51, "r_x1": 72.528, "r_y1": 616.51, "r_x2": 72.528, "r_y2": 607.958, "r_x3": 70.037, "r_y3": 607.958, "coord_origin": "TOPLEFT"}, "text": ".", "orig": ".", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 109, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 77.14, "r_y0": 616.51, "r_x1": 286.365, "r_y1": 616.51, "r_x2": 286.365, "r_y2": 607.958, "r_x3": 77.14, "r_y3": 607.958, "coord_origin": "TOPLEFT"}, "text": "The input images are resized to 448*448 pixels and", "orig": "The input images are resized to 448*448 pixels and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 110, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 628.465, "r_x1": 286.365, "r_y1": 628.465, "r_x2": 286.365, "r_y2": 619.913, "r_x3": 50.112, "r_y3": 619.913, "coord_origin": "TOPLEFT"}, "text": "the feature map has a dimension of 28*28. Additionally, we", "orig": "the feature map has a dimension of 28*28. Additionally, we", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 111, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 640.421, "r_x1": 207.033, "r_y1": 640.421, "r_x2": 207.033, "r_y2": 631.869, "r_x3": 50.112, "r_y3": 631.869, "coord_origin": "TOPLEFT"}, "text": "enforce the following input constraints:", "orig": "enforce the following input constraints:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "TableFormer uses ResNet-18 as the CNN Backbone Network . The input images are resized to 448*448 pixels and the feature map has a dimension of 28*28. Additionally, we enforce the following input constraints:"}, {"label": "formula", "id": 18, "page_no": 5, "cluster": {"id": 18, "label": "formula", "bbox": {"l": 91.661, "t": 654.496, "r": 286.362, "b": 678.31, "coord_origin": "TOPLEFT"}, "confidence": 0.844183623790741, "cells": [{"index": 112, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 91.661, "r_y0": 663.366, "r_x1": 186.017, "r_y1": 663.366, "r_x2": 186.017, "r_y2": 654.814, "r_x3": 91.661, "r_y3": 654.814, "coord_origin": "TOPLEFT"}, "text": "Image width and height", "orig": "Image width and height", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 113, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 188.507, "r_y0": 663.06, "r_x1": 196.256, "r_y1": 663.06, "r_x2": 196.256, "r_y2": 654.496, "r_x3": 188.507, "r_y3": 654.496, "coord_origin": "TOPLEFT"}, "text": "\u2264", "orig": "\u2264", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 114, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 198.746, "r_y0": 663.366, "r_x1": 244.813, "r_y1": 663.366, "r_x2": 244.813, "r_y2": 654.814, "r_x3": 198.746, "r_y3": 654.814, "coord_origin": "TOPLEFT"}, "text": "1024 pixels", "orig": "1024 pixels", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 115, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 101.016, "r_y0": 678.31, "r_x1": 186.246, "r_y1": 678.31, "r_x2": 186.246, "r_y2": 669.758, "r_x3": 101.016, "r_y3": 669.758, "coord_origin": "TOPLEFT"}, "text": "Structural tags length", "orig": "Structural tags length", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 116, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 188.736, "r_y0": 678.004, "r_x1": 196.485, "r_y1": 678.004, "r_x2": 196.485, "r_y2": 669.44, "r_x3": 188.736, "r_y3": 669.44, "coord_origin": "TOPLEFT"}, "text": "\u2264", "orig": "\u2264", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 117, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 198.975, "r_y0": 678.31, "r_x1": 244.813, "r_y1": 678.31, "r_x2": 244.813, "r_y2": 669.758, "r_x3": 198.975, "r_y3": 669.758, "coord_origin": "TOPLEFT"}, "text": "512 tokens.", "orig": "512 tokens.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 118, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 274.746, "r_y0": 670.938, "r_x1": 286.362, "r_y1": 670.938, "r_x2": 286.362, "r_y2": 662.386, "r_x3": 274.746, "r_y3": 662.386, "coord_origin": "TOPLEFT"}, "text": "(2)", "orig": "(2)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Image width and height \u2264 1024 pixels Structural tags length \u2264 512 tokens. (2)"}, {"label": "text", "id": 10, "page_no": 5, "cluster": {"id": 10, "label": "text", "bbox": {"l": 50.112, "t": 692.559, "r": 286.365, "b": 713.066, "coord_origin": "TOPLEFT"}, "confidence": 0.9724979996681213, "cells": [{"index": 119, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 701.111, "r_x1": 286.365, "r_y1": 701.111, "r_x2": 286.365, "r_y2": 692.559, "r_x3": 50.112, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "Although input constraints are used also by other methods,", "orig": "Although input constraints are used also by other methods,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 120, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 713.066, "r_x1": 286.365, "r_y1": 713.066, "r_x2": 286.365, "r_y2": 704.514, "r_x3": 50.112, "r_y3": 704.514, "coord_origin": "TOPLEFT"}, "text": "such as EDD, ours are less restrictive due to the improved", "orig": "such as EDD, ours are less restrictive due to the improved", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Although input constraints are used also by other methods, such as EDD, ours are less restrictive due to the improved"}, {"label": "text", "id": 9, "page_no": 5, "cluster": {"id": 9, "label": "text", "bbox": {"l": 308.862, "t": 75.47699999999998, "r": 545.115, "b": 107.93899999999996, "coord_origin": "TOPLEFT"}, "confidence": 0.9799237847328186, "cells": [{"index": 121, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 84.029, "r_x1": 545.115, "r_y1": 84.029, "r_x2": 545.115, "r_y2": 75.47699999999998, "r_x3": 308.862, "r_y3": 75.47699999999998, "coord_origin": "TOPLEFT"}, "text": "runtime performance and lower memory footprint of Table-", "orig": "runtime performance and lower memory footprint of Table-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 122, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 95.98400000000004, "r_x1": 339.985, "r_y1": 95.98400000000004, "r_x2": 339.985, "r_y2": 87.43200000000002, "r_x3": 308.862, "r_y3": 87.43200000000002, "coord_origin": "TOPLEFT"}, "text": "Former.", "orig": "Former.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 123, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 346.889, "r_y0": 95.98400000000004, "r_x1": 545.115, "r_y1": 95.98400000000004, "r_x2": 545.115, "r_y2": 87.43200000000002, "r_x3": 346.889, "r_y3": 87.43200000000002, "coord_origin": "TOPLEFT"}, "text": "This allows to utilize input samples with longer", "orig": "This allows to utilize input samples with longer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 124, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 107.93899999999996, "r_x1": 492.961, "r_y1": 107.93899999999996, "r_x2": 492.961, "r_y2": 99.38699999999994, "r_x3": 308.862, "r_y3": 99.38699999999994, "coord_origin": "TOPLEFT"}, "text": "sequences and images with larger dimensions.", "orig": "sequences and images with larger dimensions.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "runtime performance and lower memory footprint of TableFormer. This allows to utilize input samples with longer sequences and images with larger dimensions."}, {"label": "text", "id": 1, "page_no": 5, "cluster": {"id": 1, "label": "text", "bbox": {"l": 308.862, "t": 116.49800000000005, "r": 545.115, "b": 328.288, "coord_origin": "TOPLEFT"}, "confidence": 0.9880930781364441, "cells": [{"index": 125, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 125.04999999999995, "r_x1": 545.115, "r_y1": 125.04999999999995, "r_x2": 545.115, "r_y2": 116.49800000000005, "r_x3": 320.817, "r_y3": 116.49800000000005, "coord_origin": "TOPLEFT"}, "text": "The Transformer Encoder consists of two 'Transformer", "orig": "The Transformer Encoder consists of two 'Transformer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 126, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 137.005, "r_x1": 545.115, "r_y1": 137.005, "r_x2": 545.115, "r_y2": 128.45299999999997, "r_x3": 308.862, "r_y3": 128.45299999999997, "coord_origin": "TOPLEFT"}, "text": "Encoder Layers', with an input feature size of 512, feed", "orig": "Encoder Layers', with an input feature size of 512, feed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 127, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 148.96000000000004, "r_x1": 545.115, "r_y1": 148.96000000000004, "r_x2": 545.115, "r_y2": 140.40800000000002, "r_x3": 308.862, "r_y3": 140.40800000000002, "coord_origin": "TOPLEFT"}, "text": "forward network of 1024, and 4 attention heads. As for the", "orig": "forward network of 1024, and 4 attention heads. As for the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 128, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 160.91499999999996, "r_x1": 545.115, "r_y1": 160.91499999999996, "r_x2": 545.115, "r_y2": 152.36300000000006, "r_x3": 308.862, "r_y3": 152.36300000000006, "coord_origin": "TOPLEFT"}, "text": "Transformer Decoder it is composed of four 'Transformer", "orig": "Transformer Decoder it is composed of four 'Transformer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 129, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 172.87, "r_x1": 545.115, "r_y1": 172.87, "r_x2": 545.115, "r_y2": 164.31799999999998, "r_x3": 308.862, "r_y3": 164.31799999999998, "coord_origin": "TOPLEFT"}, "text": "Decoder Layers' with similar input and output dimensions", "orig": "Decoder Layers' with similar input and output dimensions", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 130, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 184.82600000000002, "r_x1": 317.161, "r_y1": 184.82600000000002, "r_x2": 317.161, "r_y2": 176.274, "r_x3": 308.862, "r_y3": 176.274, "coord_origin": "TOPLEFT"}, "text": "as", "orig": "as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 131, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 321.365, "r_y0": 184.82600000000002, "r_x1": 333.539, "r_y1": 184.82600000000002, "r_x2": 333.539, "r_y2": 176.274, "r_x3": 321.365, "r_y3": 176.274, "coord_origin": "TOPLEFT"}, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 132, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 337.734, "r_y0": 184.82600000000002, "r_x1": 467.218, "r_y1": 184.82600000000002, "r_x2": 467.218, "r_y2": 176.274, "r_x3": 337.734, "r_y3": 176.274, "coord_origin": "TOPLEFT"}, "text": "'Transformer Encoder Layers'.", "orig": "'Transformer Encoder Layers'.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 133, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 475.437, "r_y0": 184.82600000000002, "r_x1": 545.115, "r_y1": 184.82600000000002, "r_x2": 545.115, "r_y2": 176.274, "r_x3": 475.437, "r_y3": 176.274, "coord_origin": "TOPLEFT"}, "text": "Even though our", "orig": "Even though our", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 134, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 196.78099999999995, "r_x1": 545.115, "r_y1": 196.78099999999995, "r_x2": 545.115, "r_y2": 188.22900000000004, "r_x3": 308.862, "r_y3": 188.22900000000004, "coord_origin": "TOPLEFT"}, "text": "model uses fewer layers and heads than the default imple-", "orig": "model uses fewer layers and heads than the default imple-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 135, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 208.736, "r_x1": 399.213, "r_y1": 208.736, "r_x2": 399.213, "r_y2": 200.18399999999997, "r_x3": 308.862, "r_y3": 200.18399999999997, "coord_origin": "TOPLEFT"}, "text": "mentation parameters,", "orig": "mentation parameters,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 136, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 403.965, "r_y0": 208.736, "r_x1": 458.63, "r_y1": 208.736, "r_x2": 458.63, "r_y2": 200.18399999999997, "r_x3": 403.965, "r_y3": 200.18399999999997, "coord_origin": "TOPLEFT"}, "text": "our extensive", "orig": "our extensive", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 137, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 462.934, "r_y0": 208.736, "r_x1": 545.115, "r_y1": 208.736, "r_x2": 545.115, "r_y2": 200.18399999999997, "r_x3": 462.934, "r_y3": 200.18399999999997, "coord_origin": "TOPLEFT"}, "text": "experimentation has", "orig": "experimentation has", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 138, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 220.69100000000003, "r_x1": 527.84, "r_y1": 220.69100000000003, "r_x2": 527.84, "r_y2": 212.139, "r_x3": 308.862, "r_y3": 212.139, "coord_origin": "TOPLEFT"}, "text": "proved this setup to be more suitable for table images.", "orig": "proved this setup to be more suitable for table images.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 139, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 532.084, "r_y0": 220.69100000000003, "r_x1": 545.115, "r_y1": 220.69100000000003, "r_x2": 545.115, "r_y2": 212.139, "r_x3": 532.084, "r_y3": 212.139, "coord_origin": "TOPLEFT"}, "text": "We", "orig": "We", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 140, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 232.64599999999996, "r_x1": 341.868, "r_y1": 232.64599999999996, "r_x2": 341.868, "r_y2": 224.09400000000005, "r_x3": 308.862, "r_y3": 224.09400000000005, "coord_origin": "TOPLEFT"}, "text": "attribute", "orig": "attribute", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 141, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 346.371, "r_y0": 232.64599999999996, "r_x1": 360.767, "r_y1": 232.64599999999996, "r_x2": 360.767, "r_y2": 224.09400000000005, "r_x3": 346.371, "r_y3": 224.09400000000005, "coord_origin": "TOPLEFT"}, "text": "this", "orig": "this", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 142, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 365.27, "r_y0": 232.64599999999996, "r_x1": 393.504, "r_y1": 232.64599999999996, "r_x2": 393.504, "r_y2": 224.09400000000005, "r_x3": 365.27, "r_y3": 224.09400000000005, "coord_origin": "TOPLEFT"}, "text": "finding", "orig": "finding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 143, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 398.007, "r_y0": 232.64599999999996, "r_x1": 405.758, "r_y1": 232.64599999999996, "r_x2": 405.758, "r_y2": 224.09400000000005, "r_x3": 398.007, "r_y3": 224.09400000000005, "coord_origin": "TOPLEFT"}, "text": "to", "orig": "to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 144, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 410.261, "r_y0": 232.64599999999996, "r_x1": 422.436, "r_y1": 232.64599999999996, "r_x2": 422.436, "r_y2": 224.09400000000005, "r_x3": 410.261, "r_y3": 224.09400000000005, "coord_origin": "TOPLEFT"}, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 145, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 426.939, "r_y0": 232.64599999999996, "r_x1": 459.586, "r_y1": 232.64599999999996, "r_x2": 459.586, "r_y2": 224.09400000000005, "r_x3": 426.939, "r_y3": 224.09400000000005, "coord_origin": "TOPLEFT"}, "text": "inherent", "orig": "inherent", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 146, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 464.089, "r_y0": 232.64599999999996, "r_x1": 490.102, "r_y1": 232.64599999999996, "r_x2": 490.102, "r_y2": 224.09400000000005, "r_x3": 464.089, "r_y3": 224.09400000000005, "coord_origin": "TOPLEFT"}, "text": "design", "orig": "design", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 147, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 494.605, "r_y0": 232.64599999999996, "r_x1": 502.904, "r_y1": 232.64599999999996, "r_x2": 502.904, "r_y2": 224.09400000000005, "r_x3": 494.605, "r_y3": 224.09400000000005, "coord_origin": "TOPLEFT"}, "text": "of", "orig": "of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 148, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 507.407, "r_y0": 232.64599999999996, "r_x1": 526.774, "r_y1": 232.64599999999996, "r_x2": 526.774, "r_y2": 224.09400000000005, "r_x3": 507.407, "r_y3": 224.09400000000005, "coord_origin": "TOPLEFT"}, "text": "table", "orig": "table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 149, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 531.277, "r_y0": 232.64599999999996, "r_x1": 545.115, "r_y1": 232.64599999999996, "r_x2": 545.115, "r_y2": 224.09400000000005, "r_x3": 531.277, "r_y3": 224.09400000000005, "coord_origin": "TOPLEFT"}, "text": "im-", "orig": "im-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 150, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 244.601, "r_x1": 545.115, "r_y1": 244.601, "r_x2": 545.115, "r_y2": 236.04899999999998, "r_x3": 308.862, "r_y3": 236.04899999999998, "coord_origin": "TOPLEFT"}, "text": "ages, which contain mostly lines and text, unlike the more", "orig": "ages, which contain mostly lines and text, unlike the more", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 151, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 256.557, "r_x1": 496.169, "r_y1": 256.557, "r_x2": 496.169, "r_y2": 248.005, "r_x3": 308.862, "r_y3": 248.005, "coord_origin": "TOPLEFT"}, "text": "elaborate content present in other scopes (e.g.", "orig": "elaborate content present in other scopes (e.g.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 152, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 501.897, "r_y0": 256.557, "r_x1": 545.115, "r_y1": 256.557, "r_x2": 545.115, "r_y2": 248.005, "r_x3": 501.897, "r_y3": 248.005, "coord_origin": "TOPLEFT"}, "text": "the COCO", "orig": "the COCO", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 153, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 268.51199999999994, "r_x1": 342.336, "r_y1": 268.51199999999994, "r_x2": 342.336, "r_y2": 259.96000000000004, "r_x3": 308.862, "r_y3": 259.96000000000004, "coord_origin": "TOPLEFT"}, "text": "dataset).", "orig": "dataset).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 154, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 348.952, "r_y0": 268.51199999999994, "r_x1": 545.115, "r_y1": 268.51199999999994, "r_x2": 545.115, "r_y2": 259.96000000000004, "r_x3": 348.952, "r_y3": 259.96000000000004, "coord_origin": "TOPLEFT"}, "text": "Moreover, we have added ResNet blocks to the", "orig": "Moreover, we have added ResNet blocks to the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 155, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 280.467, "r_x1": 545.115, "r_y1": 280.467, "r_x2": 545.115, "r_y2": 271.91499999999996, "r_x3": 308.862, "r_y3": 271.91499999999996, "coord_origin": "TOPLEFT"}, "text": "inputs of the Structure Decoder and Cell BBox Decoder.", "orig": "inputs of the Structure Decoder and Cell BBox Decoder.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 156, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 292.422, "r_x1": 545.115, "r_y1": 292.422, "r_x2": 545.115, "r_y2": 283.87, "r_x3": 308.862, "r_y3": 283.87, "coord_origin": "TOPLEFT"}, "text": "This prevents a decoder having a stronger influence over the", "orig": "This prevents a decoder having a stronger influence over the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 157, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 304.377, "r_x1": 545.115, "r_y1": 304.377, "r_x2": 545.115, "r_y2": 295.825, "r_x3": 308.862, "r_y3": 295.825, "coord_origin": "TOPLEFT"}, "text": "learned weights which would damage the other prediction", "orig": "learned weights which would damage the other prediction", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 158, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 316.332, "r_x1": 545.115, "r_y1": 316.332, "r_x2": 545.115, "r_y2": 307.78, "r_x3": 308.862, "r_y3": 307.78, "coord_origin": "TOPLEFT"}, "text": "task (structure vs bounding boxes), but learn task specific", "orig": "task (structure vs bounding boxes), but learn task specific", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 159, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 328.288, "r_x1": 532.483, "r_y1": 328.288, "r_x2": 532.483, "r_y2": 319.736, "r_x3": 308.862, "r_y3": 319.736, "coord_origin": "TOPLEFT"}, "text": "weights instead. Lastly our dropout layers are set to 0.5.", "orig": "weights instead. Lastly our dropout layers are set to 0.5.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "The Transformer Encoder consists of two 'Transformer Encoder Layers', with an input feature size of 512, feed forward network of 1024, and 4 attention heads. As for the Transformer Decoder it is composed of four 'Transformer Decoder Layers' with similar input and output dimensions as the 'Transformer Encoder Layers'. Even though our model uses fewer layers and heads than the default implementation parameters, our extensive experimentation has proved this setup to be more suitable for table images. We attribute this finding to the inherent design of table images, which contain mostly lines and text, unlike the more elaborate content present in other scopes (e.g. the COCO dataset). Moreover, we have added ResNet blocks to the inputs of the Structure Decoder and Cell BBox Decoder. This prevents a decoder having a stronger influence over the learned weights which would damage the other prediction task (structure vs bounding boxes), but learn task specific weights instead. Lastly our dropout layers are set to 0.5."}, {"label": "text", "id": 3, "page_no": 5, "cluster": {"id": 3, "label": "text", "bbox": {"l": 308.862, "t": 336.846, "r": 545.115, "b": 429.084, "coord_origin": "TOPLEFT"}, "confidence": 0.9877589344978333, "cells": [{"index": 160, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 345.398, "r_x1": 545.115, "r_y1": 345.398, "r_x2": 545.115, "r_y2": 336.846, "r_x3": 320.817, "r_y3": 336.846, "coord_origin": "TOPLEFT"}, "text": "For training, TableFormer is trained with 3 Adam opti-", "orig": "For training, TableFormer is trained with 3 Adam opti-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 161, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 357.353, "r_x1": 403.736, "r_y1": 357.353, "r_x2": 403.736, "r_y2": 348.801, "r_x3": 308.862, "r_y3": 348.801, "coord_origin": "TOPLEFT"}, "text": "mizers, each one for the", "orig": "mizers, each one for the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 162, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 406.076, "r_y0": 357.21, "r_x1": 545.112, "r_y1": 357.21, "r_x2": 545.112, "r_y2": 348.622, "r_x3": 406.076, "r_y3": 348.622, "coord_origin": "TOPLEFT"}, "text": "CNN Backbone Network Structure", "orig": "CNN Backbone Network Structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 163, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 503.539, "r_y0": 357.353, "r_x1": 506.03, "r_y1": 357.353, "r_x2": 506.03, "r_y2": 348.801, "r_x3": 503.539, "r_y3": 348.801, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 164, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 369.165, "r_x1": 343.163, "r_y1": 369.165, "r_x2": 343.163, "r_y2": 360.577, "r_x3": 308.862, "r_y3": 360.577, "coord_origin": "TOPLEFT"}, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 165, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 343.163, "r_y0": 369.308, "r_x1": 362.202, "r_y1": 369.308, "r_x2": 362.202, "r_y2": 360.756, "r_x3": 343.163, "r_y3": 360.756, "coord_origin": "TOPLEFT"}, "text": ", and", "orig": ", and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 166, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 364.286, "r_y0": 369.165, "r_x1": 440.938, "r_y1": 369.165, "r_x2": 440.938, "r_y2": 360.577, "r_x3": 364.286, "r_y3": 360.577, "coord_origin": "TOPLEFT"}, "text": "Cell BBox Decoder", "orig": "Cell BBox Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 167, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 440.939, "r_y0": 369.308, "r_x1": 443.43, "r_y1": 369.308, "r_x2": 443.43, "r_y2": 360.756, "r_x3": 440.939, "r_y3": 360.756, "coord_origin": "TOPLEFT"}, "text": ".", "orig": ".", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 168, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 446.379, "r_y0": 369.308, "r_x1": 545.108, "r_y1": 369.308, "r_x2": 545.108, "r_y2": 360.756, "r_x3": 446.379, "r_y3": 360.756, "coord_origin": "TOPLEFT"}, "text": "Taking the PubTabNet as", "orig": "Taking the PubTabNet as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 169, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 381.263, "r_x1": 545.115, "r_y1": 381.263, "r_x2": 545.115, "r_y2": 372.711, "r_x3": 308.862, "r_y3": 372.711, "coord_origin": "TOPLEFT"}, "text": "an example for our parameter set up, the initializing learn-", "orig": "an example for our parameter set up, the initializing learn-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 170, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 393.219, "r_x1": 545.115, "r_y1": 393.219, "r_x2": 545.115, "r_y2": 384.667, "r_x3": 308.862, "r_y3": 384.667, "coord_origin": "TOPLEFT"}, "text": "ing rate is 0.001 for 12 epochs with a batch size of 24, and", "orig": "ing rate is 0.001 for 12 epochs with a batch size of 24, and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 171, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 405.01, "r_x1": 314.673, "r_y1": 405.01, "r_x2": 314.673, "r_y2": 396.304, "r_x3": 308.862, "r_y3": 396.304, "coord_origin": "TOPLEFT"}, "text": "\u03bb", "orig": "\u03bb", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 172, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 318.658, "r_y0": 405.174, "r_x1": 329.726, "r_y1": 405.174, "r_x2": 329.726, "r_y2": 396.622, "r_x3": 318.658, "r_y3": 396.622, "coord_origin": "TOPLEFT"}, "text": "set", "orig": "set", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 173, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 333.711, "r_y0": 405.174, "r_x1": 341.462, "r_y1": 405.174, "r_x2": 341.462, "r_y2": 396.622, "r_x3": 333.711, "r_y3": 396.622, "coord_origin": "TOPLEFT"}, "text": "to", "orig": "to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 174, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 345.447, "r_y0": 405.174, "r_x1": 360.391, "r_y1": 405.174, "r_x2": 360.391, "r_y2": 396.622, "r_x3": 345.447, "r_y3": 396.622, "coord_origin": "TOPLEFT"}, "text": "0.5.", "orig": "0.5.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 175, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 367.963, "r_y0": 405.174, "r_x1": 415.166, "r_y1": 405.174, "r_x2": 415.166, "r_y2": 396.622, "r_x3": 367.963, "r_y3": 396.622, "coord_origin": "TOPLEFT"}, "text": "Afterwards,", "orig": "Afterwards,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 176, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 419.519, "r_y0": 405.174, "r_x1": 545.108, "r_y1": 405.174, "r_x2": 545.108, "r_y2": 396.622, "r_x3": 419.519, "r_y3": 396.622, "coord_origin": "TOPLEFT"}, "text": "we reduce the learning rate to", "orig": "we reduce the learning rate to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 177, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 417.129, "r_x1": 545.115, "r_y1": 417.129, "r_x2": 545.115, "r_y2": 408.577, "r_x3": 308.862, "r_y3": 408.577, "coord_origin": "TOPLEFT"}, "text": "0.0001, the batch size to 18 and train for 12 more epochs or", "orig": "0.0001, the batch size to 18 and train for 12 more epochs or", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 178, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 429.084, "r_x1": 360.966, "r_y1": 429.084, "r_x2": 360.966, "r_y2": 420.532, "r_x3": 308.862, "r_y3": 420.532, "coord_origin": "TOPLEFT"}, "text": "convergence.", "orig": "convergence.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "For training, TableFormer is trained with 3 Adam optimizers, each one for the CNN Backbone Network Structure , Decoder , and Cell BBox Decoder . Taking the PubTabNet as an example for our parameter set up, the initializing learning rate is 0.001 for 12 epochs with a batch size of 24, and \u03bb set to 0.5. Afterwards, we reduce the learning rate to 0.0001, the batch size to 18 and train for 12 more epochs or convergence."}, {"label": "text", "id": 0, "page_no": 5, "cluster": {"id": 0, "label": "text", "bbox": {"l": 308.862, "t": 437.643, "r": 545.115, "b": 553.7909999999999, "coord_origin": "TOPLEFT"}, "confidence": 0.9884491562843323, "cells": [{"index": 179, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 446.195, "r_x1": 545.115, "r_y1": 446.195, "r_x2": 545.115, "r_y2": 437.643, "r_x3": 320.817, "r_y3": 437.643, "coord_origin": "TOPLEFT"}, "text": "TableFormer is implemented with PyTorch and Torchvi-", "orig": "TableFormer is implemented with PyTorch and Torchvi-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 180, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 458.15, "r_x1": 384.628, "r_y1": 458.15, "r_x2": 384.628, "r_y2": 449.598, "r_x3": 308.862, "r_y3": 449.598, "coord_origin": "TOPLEFT"}, "text": "sion libraries [22].", "orig": "sion libraries [22].", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 181, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 391.372, "r_y0": 458.15, "r_x1": 545.115, "r_y1": 458.15, "r_x2": 545.115, "r_y2": 449.598, "r_x3": 391.372, "r_y3": 449.598, "coord_origin": "TOPLEFT"}, "text": "To speed up the inference, the image", "orig": "To speed up the inference, the image", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 182, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 470.105, "r_x1": 494.007, "r_y1": 470.105, "r_x2": 494.007, "r_y2": 461.553, "r_x3": 308.862, "r_y3": 461.553, "coord_origin": "TOPLEFT"}, "text": "undergoes a single forward pass through the", "orig": "undergoes a single forward pass through the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 183, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 498.078, "r_y0": 469.962, "r_x1": 545.111, "r_y1": 469.962, "r_x2": 545.111, "r_y2": 461.374, "r_x3": 498.078, "r_y3": 461.374, "coord_origin": "TOPLEFT"}, "text": "CNN Back-", "orig": "CNN Back-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 184, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 481.917, "r_x1": 364.443, "r_y1": 481.917, "r_x2": 364.443, "r_y2": 473.329, "r_x3": 308.862, "r_y3": 473.329, "coord_origin": "TOPLEFT"}, "text": "bone Network", "orig": "bone Network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 185, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 367.061, "r_y0": 482.06, "r_x1": 545.113, "r_y1": 482.06, "r_x2": 545.113, "r_y2": 473.508, "r_x3": 367.061, "r_y3": 473.508, "coord_origin": "TOPLEFT"}, "text": "and transformer encoder. This eliminates the", "orig": "and transformer encoder. This eliminates the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 186, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 494.015, "r_x1": 545.115, "r_y1": 494.015, "r_x2": 545.115, "r_y2": 485.463, "r_x3": 308.862, "r_y3": 485.463, "coord_origin": "TOPLEFT"}, "text": "overhead of generating the same features for each decoding", "orig": "overhead of generating the same features for each decoding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 187, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 505.97, "r_x1": 545.115, "r_y1": 505.97, "r_x2": 545.115, "r_y2": 497.418, "r_x3": 308.862, "r_y3": 497.418, "coord_origin": "TOPLEFT"}, "text": "step. Similarly, we employ a 'caching' technique to preform", "orig": "step. Similarly, we employ a 'caching' technique to preform", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 188, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 517.9259999999999, "r_x1": 432.588, "r_y1": 517.9259999999999, "r_x2": 432.588, "r_y2": 509.374, "r_x3": 308.862, "r_y3": 509.374, "coord_origin": "TOPLEFT"}, "text": "faster autoregressive decoding.", "orig": "faster autoregressive decoding.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 189, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 436.732, "r_y0": 517.9259999999999, "r_x1": 545.115, "r_y1": 517.9259999999999, "r_x2": 545.115, "r_y2": 509.374, "r_x3": 436.732, "r_y3": 509.374, "coord_origin": "TOPLEFT"}, "text": "This is achieved by storing", "orig": "This is achieved by storing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 190, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 529.881, "r_x1": 545.115, "r_y1": 529.881, "r_x2": 545.115, "r_y2": 521.329, "r_x3": 308.862, "r_y3": 521.329, "coord_origin": "TOPLEFT"}, "text": "the features of decoded tokens so we can reuse them for", "orig": "the features of decoded tokens so we can reuse them for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 191, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 541.836, "r_x1": 370.062, "r_y1": 541.836, "r_x2": 370.062, "r_y2": 533.284, "r_x3": 308.862, "r_y3": 533.284, "coord_origin": "TOPLEFT"}, "text": "each time step.", "orig": "each time step.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 192, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 375.721, "r_y0": 541.836, "r_x1": 545.115, "r_y1": 541.836, "r_x2": 545.115, "r_y2": 533.284, "r_x3": 375.721, "r_y3": 533.284, "coord_origin": "TOPLEFT"}, "text": "Therefore, we only compute the attention", "orig": "Therefore, we only compute the attention", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 193, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 553.7909999999999, "r_x1": 377.215, "r_y1": 553.7909999999999, "r_x2": 377.215, "r_y2": 545.239, "r_x3": 308.862, "r_y3": 545.239, "coord_origin": "TOPLEFT"}, "text": "for each new tag.", "orig": "for each new tag.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "TableFormer is implemented with PyTorch and Torchvision libraries [22]. To speed up the inference, the image undergoes a single forward pass through the CNN Backbone Network and transformer encoder. This eliminates the overhead of generating the same features for each decoding step. Similarly, we employ a 'caching' technique to preform faster autoregressive decoding. This is achieved by storing the features of decoded tokens so we can reuse them for each time step. Therefore, we only compute the attention for each new tag."}, {"label": "section_header", "id": 14, "page_no": 5, "cluster": {"id": 14, "label": "section_header", "bbox": {"l": 308.862, "t": 579.554, "r": 397.443, "b": 589.406, "coord_origin": "TOPLEFT"}, "confidence": 0.9450808763504028, "cells": [{"index": 194, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 589.406, "r_x1": 397.443, "r_y1": 589.406, "r_x2": 397.443, "r_y2": 579.554, "r_x3": 308.862, "r_y3": 579.554, "coord_origin": "TOPLEFT"}, "text": "5.2. Generalization", "orig": "5.2. Generalization", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "5.2. Generalization"}, {"label": "text", "id": 2, "page_no": 5, "cluster": {"id": 2, "label": "text", "bbox": {"l": 308.862, "t": 603.718, "r": 545.115, "b": 672.046, "coord_origin": "TOPLEFT"}, "confidence": 0.9880595803260803, "cells": [{"index": 195, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 612.27, "r_x1": 545.115, "r_y1": 612.27, "r_x2": 545.115, "r_y2": 603.718, "r_x3": 320.817, "r_y3": 603.718, "coord_origin": "TOPLEFT"}, "text": "TableFormer is evaluated on three major publicly avail-", "orig": "TableFormer is evaluated on three major publicly avail-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 196, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 624.225, "r_x1": 545.115, "r_y1": 624.225, "r_x2": 545.115, "r_y2": 615.673, "r_x3": 308.862, "r_y3": 615.673, "coord_origin": "TOPLEFT"}, "text": "able datasets of different nature to prove the generalization", "orig": "able datasets of different nature to prove the generalization", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 197, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 636.1800000000001, "r_x1": 545.115, "r_y1": 636.1800000000001, "r_x2": 545.115, "r_y2": 627.6279999999999, "r_x3": 308.862, "r_y3": 627.6279999999999, "coord_origin": "TOPLEFT"}, "text": "and effectiveness of our model. The datasets used for eval-", "orig": "and effectiveness of our model. The datasets used for eval-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 198, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 648.135, "r_x1": 545.115, "r_y1": 648.135, "r_x2": 545.115, "r_y2": 639.583, "r_x3": 308.862, "r_y3": 639.583, "coord_origin": "TOPLEFT"}, "text": "uation are the PubTabNet, FinTabNet and TableBank which", "orig": "uation are the PubTabNet, FinTabNet and TableBank which", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 199, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 660.091, "r_x1": 545.115, "r_y1": 660.091, "r_x2": 545.115, "r_y2": 651.539, "r_x3": 308.862, "r_y3": 651.539, "coord_origin": "TOPLEFT"}, "text": "stem from the scientific, financial and general domains re-", "orig": "stem from the scientific, financial and general domains re-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 200, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 672.046, "r_x1": 350.705, "r_y1": 672.046, "r_x2": 350.705, "r_y2": 663.494, "r_x3": 308.862, "r_y3": 663.494, "coord_origin": "TOPLEFT"}, "text": "spectively.", "orig": "spectively.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "TableFormer is evaluated on three major publicly available datasets of different nature to prove the generalization and effectiveness of our model. The datasets used for evaluation are the PubTabNet, FinTabNet and TableBank which stem from the scientific, financial and general domains respectively."}, {"label": "text", "id": 8, "page_no": 5, "cluster": {"id": 8, "label": "text", "bbox": {"l": 308.862, "t": 680.604, "r": 545.115, "b": 713.067, "coord_origin": "TOPLEFT"}, "confidence": 0.9830910563468933, "cells": [{"index": 201, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 689.156, "r_x1": 545.115, "r_y1": 689.156, "r_x2": 545.115, "r_y2": 680.604, "r_x3": 320.817, "r_y3": 680.604, "coord_origin": "TOPLEFT"}, "text": "We also share our baseline results on the challenging", "orig": "We also share our baseline results on the challenging", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 202, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 701.111, "r_x1": 361.196, "r_y1": 701.111, "r_x2": 361.196, "r_y2": 692.559, "r_x3": 308.862, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "SynthTabNet", "orig": "SynthTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 203, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 366.057, "r_y0": 701.111, "r_x1": 396.214, "r_y1": 701.111, "r_x2": 396.214, "r_y2": 692.559, "r_x3": 366.057, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "dataset.", "orig": "dataset.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 204, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 406.406, "r_y0": 701.111, "r_x1": 453.449, "r_y1": 701.111, "r_x2": 453.449, "r_y2": 692.559, "r_x3": 406.406, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "Throughout", "orig": "Throughout", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 205, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 458.311, "r_y0": 701.111, "r_x1": 471.591, "r_y1": 701.111, "r_x2": 471.591, "r_y2": 692.559, "r_x3": 458.311, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "our", "orig": "our", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 206, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 476.453, "r_y0": 701.111, "r_x1": 527.481, "r_y1": 701.111, "r_x2": 527.481, "r_y2": 692.559, "r_x3": 476.453, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "experiments,", "orig": "experiments,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 207, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 532.941, "r_y0": 701.111, "r_x1": 545.115, "r_y1": 701.111, "r_x2": 545.115, "r_y2": 692.559, "r_x3": 532.941, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 208, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 713.067, "r_x1": 495.94, "r_y1": 713.067, "r_x2": 495.94, "r_y2": 704.515, "r_x3": 308.862, "r_y3": 704.515, "coord_origin": "TOPLEFT"}, "text": "same parameters stated in Sec. 5.1 are utilized.", "orig": "same parameters stated in Sec. 5.1 are utilized.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "We also share our baseline results on the challenging SynthTabNet dataset. Throughout our experiments, the same parameters stated in Sec. 5.1 are utilized."}], "headers": [{"label": "page_footer", "id": 17, "page_no": 5, "cluster": {"id": 17, "label": "page_footer", "bbox": {"l": 295.121, "t": 734.402, "r": 300.102, "b": 742.954, "coord_origin": "TOPLEFT"}, "confidence": 0.8820409178733826, "cells": [{"index": 209, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 295.121, "r_y0": 742.954, "r_x1": 300.102, "r_y1": 742.954, "r_x2": 300.102, "r_y2": 734.402, "r_x3": 295.121, "r_y3": 734.402, "coord_origin": "TOPLEFT"}, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "6"}]}}, {"page_no": 6, "size": {"width": 612.0, "height": 792.0}, "cells": [{"index": 0, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 84.25300000000004, "r_x1": 167.898, "r_y1": 84.25300000000004, "r_x2": 167.898, "r_y2": 74.40099999999995, "r_x3": 50.112, "r_y3": 74.40099999999995, "coord_origin": "TOPLEFT"}, "text": "5.3. Datasets and Metrics", "orig": "5.3. Datasets and Metrics", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 102.17100000000005, "r_x1": 286.365, "r_y1": 102.17100000000005, "r_x2": 286.365, "r_y2": 93.61900000000003, "r_x3": 62.067, "r_y3": 93.61900000000003, "coord_origin": "TOPLEFT"}, "text": "The Tree-Edit-Distance-Based Similarity (TEDS) met-", "orig": "The Tree-Edit-Distance-Based Similarity (TEDS) met-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 114.12599999999998, "r_x1": 286.365, "r_y1": 114.12599999999998, "r_x2": 286.365, "r_y2": 105.57399999999996, "r_x3": 50.112, "r_y3": 105.57399999999996, "coord_origin": "TOPLEFT"}, "text": "ric was introduced in [37]. It represents the prediction, and", "orig": "ric was introduced in [37]. It represents the prediction, and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 126.08100000000002, "r_x1": 239.999, "r_y1": 126.08100000000002, "r_x2": 239.999, "r_y2": 117.529, "r_x3": 50.112, "r_y3": 117.529, "coord_origin": "TOPLEFT"}, "text": "ground-truth as a tree structure of HTML tags.", "orig": "ground-truth as a tree structure of HTML tags.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 245.03, "r_y0": 126.08100000000002, "r_x1": 286.365, "r_y1": 126.08100000000002, "r_x2": 286.365, "r_y2": 117.529, "r_x3": 245.03, "r_y3": 117.529, "coord_origin": "TOPLEFT"}, "text": "This simi-", "orig": "This simi-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 138.03700000000003, "r_x1": 136.717, "r_y1": 138.03700000000003, "r_x2": 136.717, "r_y2": 129.485, "r_x3": 50.112, "r_y3": 129.485, "coord_origin": "TOPLEFT"}, "text": "larity is calculated as:", "orig": "larity is calculated as:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 86.219, "r_y0": 165.87400000000002, "r_x1": 118.878, "r_y1": 165.87400000000002, "r_x2": 118.878, "r_y2": 157.168, "r_x3": 86.219, "r_y3": 157.168, "coord_origin": "TOPLEFT"}, "text": "TEDS(", "orig": "TEDS(", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 118.875, "r_y0": 165.87400000000002, "r_x1": 139.77, "r_y1": 165.87400000000002, "r_x2": 139.77, "r_y2": 157.168, "r_x3": 118.875, "r_y3": 157.168, "coord_origin": "TOPLEFT"}, "text": "T , T", "orig": "T , T", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 124.697, "r_y0": 166.798, "r_x1": 129.019, "r_y1": 166.798, "r_x2": 129.019, "r_y2": 160.70399999999995, "r_x3": 124.697, "r_y3": 160.70399999999995, "coord_origin": "TOPLEFT"}, "text": "a", "orig": "a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 139.766, "r_y0": 166.798, "r_x1": 143.27, "r_y1": 166.798, "r_x2": 143.27, "r_y2": 160.70399999999995, "r_x3": 139.766, "r_y3": 160.70399999999995, "coord_origin": "TOPLEFT"}, "text": "b", "orig": "b", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 143.768, "r_y0": 165.87400000000002, "r_x1": 165.902, "r_y1": 165.87400000000002, "r_x2": 165.902, "r_y2": 157.168, "r_x3": 143.768, "r_y3": 157.168, "coord_origin": "TOPLEFT"}, "text": ") = 1", "orig": ") = 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 168.121, "r_y0": 165.73199999999997, "r_x1": 175.87, "r_y1": 165.73199999999997, "r_x2": 175.87, "r_y2": 157.168, "r_x3": 168.121, "r_y3": 157.168, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 179.279, "r_y0": 159.13400000000001, "r_x1": 221.957, "r_y1": 159.13400000000001, "r_x2": 221.957, "r_y2": 150.428, "r_x3": 179.279, "r_y3": 150.428, "coord_origin": "TOPLEFT"}, "text": "EditDist (", "orig": "EditDist (", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 221.952, "r_y0": 159.13400000000001, "r_x1": 242.848, "r_y1": 159.13400000000001, "r_x2": 242.848, "r_y2": 150.428, "r_x3": 221.952, "r_y3": 150.428, "coord_origin": "TOPLEFT"}, "text": "T , T", "orig": "T , T", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 227.774, "r_y0": 160.058, "r_x1": 232.096, "r_y1": 160.058, "r_x2": 232.096, "r_y2": 153.96400000000006, "r_x3": 227.774, "r_y3": 153.96400000000006, "coord_origin": "TOPLEFT"}, "text": "a", "orig": "a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 242.843, "r_y0": 160.058, "r_x1": 246.347, "r_y1": 160.058, "r_x2": 246.347, "r_y2": 153.96400000000006, "r_x3": 242.843, "r_y3": 153.96400000000006, "coord_origin": "TOPLEFT"}, "text": "b", "orig": "b", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 246.845, "r_y0": 159.13400000000001, "r_x1": 250.719, "r_y1": 159.13400000000001, "r_x2": 250.719, "r_y2": 150.428, "r_x3": 246.845, "r_y3": 150.428, "coord_origin": "TOPLEFT"}, "text": ")", "orig": ")", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 182.212, "r_y0": 172.70799999999997, "r_x1": 206.292, "r_y1": 172.70799999999997, "r_x2": 206.292, "r_y2": 164.00199999999995, "r_x3": 182.212, "r_y3": 164.00199999999995, "coord_origin": "TOPLEFT"}, "text": "max(", "orig": "max(", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 206.289, "r_y0": 172.56600000000003, "r_x1": 209.057, "r_y1": 172.56600000000003, "r_x2": 209.057, "r_y2": 164.00199999999995, "r_x3": 206.289, "r_y3": 164.00199999999995, "coord_origin": "TOPLEFT"}, "text": "|", "orig": "|", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 19, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 209.056, "r_y0": 172.70799999999997, "r_x1": 214.878, "r_y1": 172.70799999999997, "r_x2": 214.878, "r_y2": 164.00199999999995, "r_x3": 209.056, "r_y3": 164.00199999999995, "coord_origin": "TOPLEFT"}, "text": "T", "orig": "T", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 20, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 214.878, "r_y0": 173.63199999999995, "r_x1": 219.2, "r_y1": 173.63199999999995, "r_x2": 219.2, "r_y2": 167.538, "r_x3": 214.878, "r_y3": 167.538, "coord_origin": "TOPLEFT"}, "text": "a", "orig": "a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 21, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 219.697, "r_y0": 172.56600000000003, "r_x1": 222.465, "r_y1": 172.56600000000003, "r_x2": 222.465, "r_y2": 164.00199999999995, "r_x3": 219.697, "r_y3": 164.00199999999995, "coord_origin": "TOPLEFT"}, "text": "|", "orig": "|", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 22, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 224.125, "r_y0": 172.70799999999997, "r_x1": 226.893, "r_y1": 172.70799999999997, "r_x2": 226.893, "r_y2": 164.00199999999995, "r_x3": 224.125, "r_y3": 164.00199999999995, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 23, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 228.553, "r_y0": 172.56600000000003, "r_x1": 231.321, "r_y1": 172.56600000000003, "r_x2": 231.321, "r_y2": 164.00199999999995, "r_x3": 228.553, "r_y3": 164.00199999999995, "coord_origin": "TOPLEFT"}, "text": "|", "orig": "|", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 24, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 231.32, "r_y0": 172.70799999999997, "r_x1": 237.142, "r_y1": 172.70799999999997, "r_x2": 237.142, "r_y2": 164.00199999999995, "r_x3": 231.32, "r_y3": 164.00199999999995, "coord_origin": "TOPLEFT"}, "text": "T", "orig": "T", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 25, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 237.142, "r_y0": 173.63199999999995, "r_x1": 240.646, "r_y1": 173.63199999999995, "r_x2": 240.646, "r_y2": 167.538, "r_x3": 237.142, "r_y3": 167.538, "coord_origin": "TOPLEFT"}, "text": "b", "orig": "b", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 26, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 241.144, "r_y0": 172.56600000000003, "r_x1": 243.912, "r_y1": 172.56600000000003, "r_x2": 243.912, "r_y2": 164.00199999999995, "r_x3": 241.144, "r_y3": 164.00199999999995, "coord_origin": "TOPLEFT"}, "text": "|", "orig": "|", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 27, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 243.911, "r_y0": 172.70799999999997, "r_x1": 247.785, "r_y1": 172.70799999999997, "r_x2": 247.785, "r_y2": 164.00199999999995, "r_x3": 243.911, "r_y3": 164.00199999999995, "coord_origin": "TOPLEFT"}, "text": ")", "orig": ")", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 28, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 274.746, "r_y0": 166.038, "r_x1": 286.362, "r_y1": 166.038, "r_x2": 286.362, "r_y2": 157.486, "r_x3": 274.746, "r_y3": 157.486, "coord_origin": "TOPLEFT"}, "text": "(3)", "orig": "(3)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 29, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 189.98299999999995, "r_x1": 86.406, "r_y1": 189.98299999999995, "r_x2": 86.406, "r_y2": 181.43100000000004, "r_x3": 62.067, "r_y3": 181.43100000000004, "coord_origin": "TOPLEFT"}, "text": "where", "orig": "where", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 30, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 88.581, "r_y0": 189.81899999999996, "r_x1": 94.403, "r_y1": 189.81899999999996, "r_x2": 94.403, "r_y2": 181.11300000000006, "r_x3": 88.581, "r_y3": 181.11300000000006, "coord_origin": "TOPLEFT"}, "text": "T", "orig": "T", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 94.403, "r_y0": 190.74199999999996, "r_x1": 98.725, "r_y1": 190.74199999999996, "r_x2": 98.725, "r_y2": 184.64800000000002, "r_x3": 94.403, "r_y3": 184.64800000000002, "coord_origin": "TOPLEFT"}, "text": "a", "orig": "a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 101.399, "r_y0": 189.98299999999995, "r_x1": 115.785, "r_y1": 189.98299999999995, "r_x2": 115.785, "r_y2": 181.43100000000004, "r_x3": 101.399, "r_y3": 181.43100000000004, "coord_origin": "TOPLEFT"}, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 117.961, "r_y0": 189.81899999999996, "r_x1": 123.783, "r_y1": 189.81899999999996, "r_x2": 123.783, "r_y2": 181.11300000000006, "r_x3": 117.961, "r_y3": 181.11300000000006, "coord_origin": "TOPLEFT"}, "text": "T", "orig": "T", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 123.783, "r_y0": 190.74199999999996, "r_x1": 127.287, "r_y1": 190.74199999999996, "r_x2": 127.287, "r_y2": 184.64800000000002, "r_x3": 123.783, "r_y3": 184.64800000000002, "coord_origin": "TOPLEFT"}, "text": "b", "orig": "b", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 129.96, "r_y0": 189.98299999999995, "r_x1": 286.363, "r_y1": 189.98299999999995, "r_x2": 286.363, "r_y2": 181.43100000000004, "r_x3": 129.96, "r_y3": 181.43100000000004, "coord_origin": "TOPLEFT"}, "text": "represent tables in tree structure HTML", "orig": "represent tables in tree structure HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 201.938, "r_x1": 252.781, "r_y1": 201.938, "r_x2": 252.781, "r_y2": 193.38599999999997, "r_x3": 50.112, "r_y3": 193.38599999999997, "coord_origin": "TOPLEFT"}, "text": "format. EditDist denotes the tree-edit distance, and", "orig": "format. EditDist denotes the tree-edit distance, and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 255.182, "r_y0": 201.63199999999995, "r_x1": 257.95, "r_y1": 201.63199999999995, "r_x2": 257.95, "r_y2": 193.06799999999998, "r_x3": 255.182, "r_y3": 193.06799999999998, "coord_origin": "TOPLEFT"}, "text": "|", "orig": "|", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 257.949, "r_y0": 201.774, "r_x1": 263.771, "r_y1": 201.774, "r_x2": 263.771, "r_y2": 193.06799999999998, "r_x3": 257.949, "r_y3": 193.06799999999998, "coord_origin": "TOPLEFT"}, "text": "T", "orig": "T", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 265.155, "r_y0": 201.63199999999995, "r_x1": 267.923, "r_y1": 201.63199999999995, "r_x2": 267.923, "r_y2": 193.06799999999998, "r_x3": 265.155, "r_y3": 193.06799999999998, "coord_origin": "TOPLEFT"}, "text": "|", "orig": "|", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 270.322, "r_y0": 201.938, "r_x1": 286.362, "r_y1": 201.938, "r_x2": 286.362, "r_y2": 193.38599999999997, "r_x3": 270.322, "r_y3": 193.38599999999997, "coord_origin": "TOPLEFT"}, "text": "rep-", "orig": "rep-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 213.89300000000003, "r_x1": 172.134, "r_y1": 213.89300000000003, "r_x2": 172.134, "r_y2": 205.341, "r_x3": 50.112, "r_y3": 205.341, "coord_origin": "TOPLEFT"}, "text": "resents the number of nodes in", "orig": "resents the number of nodes in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 174.624, "r_y0": 213.72900000000004, "r_x1": 180.446, "r_y1": 213.72900000000004, "r_x2": 180.446, "r_y2": 205.02300000000002, "r_x3": 174.624, "r_y3": 205.02300000000002, "coord_origin": "TOPLEFT"}, "text": "T", "orig": "T", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 181.829, "r_y0": 213.89300000000003, "r_x1": 184.32, "r_y1": 213.89300000000003, "r_x2": 184.32, "r_y2": 205.341, "r_x3": 181.829, "r_y3": 205.341, "coord_origin": "TOPLEFT"}, "text": ".", "orig": ".", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 234.67100000000005, "r_x1": 170.452, "r_y1": 234.67100000000005, "r_x2": 170.452, "r_y2": 224.81899999999996, "r_x3": 50.112, "r_y3": 224.81899999999996, "coord_origin": "TOPLEFT"}, "text": "5.4. Quantitative Analysis", "orig": "5.4. Quantitative Analysis", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 252.606, "r_x1": 105.325, "r_y1": 252.606, "r_x2": 105.325, "r_y2": 243.64999999999998, "r_x3": 62.067, "r_y3": 243.64999999999998, "coord_origin": "TOPLEFT"}, "text": "Structure.", "orig": "Structure.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 112.126, "r_y0": 252.59000000000003, "r_x1": 184.684, "r_y1": 252.59000000000003, "r_x2": 184.684, "r_y2": 244.038, "r_x3": 112.126, "r_y3": 244.038, "coord_origin": "TOPLEFT"}, "text": "As shown in Tab.", "orig": "As shown in Tab.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 191.478, "r_y0": 252.59000000000003, "r_x1": 198.95, "r_y1": 252.59000000000003, "r_x2": 198.95, "r_y2": 244.038, "r_x3": 191.478, "r_y3": 244.038, "coord_origin": "TOPLEFT"}, "text": "2,", "orig": "2,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 48, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 202.995, "r_y0": 252.59000000000003, "r_x1": 286.362, "r_y1": 252.59000000000003, "r_x2": 286.362, "r_y2": 244.038, "r_x3": 202.995, "r_y3": 244.038, "coord_origin": "TOPLEFT"}, "text": "TableFormer outper-", "orig": "TableFormer outper-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 49, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 264.54499999999996, "r_x1": 286.365, "r_y1": 264.54499999999996, "r_x2": 286.365, "r_y2": 255.99300000000005, "r_x3": 50.112, "r_y3": 255.99300000000005, "coord_origin": "TOPLEFT"}, "text": "forms all SOTA methods across different datasets by a large", "orig": "forms all SOTA methods across different datasets by a large", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 50, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 276.5, "r_x1": 138.719, "r_y1": 276.5, "r_x2": 138.719, "r_y2": 267.948, "r_x3": 50.112, "r_y3": 267.948, "coord_origin": "TOPLEFT"}, "text": "margin for predicting", "orig": "margin for predicting", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 51, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 142.993, "r_y0": 276.5, "r_x1": 155.168, "r_y1": 276.5, "r_x2": 155.168, "r_y2": 267.948, "r_x3": 142.993, "r_y3": 267.948, "coord_origin": "TOPLEFT"}, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 52, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 159.432, "r_y0": 276.5, "r_x1": 178.799, "r_y1": 276.5, "r_x2": 178.799, "r_y2": 267.948, "r_x3": 159.432, "r_y3": 267.948, "coord_origin": "TOPLEFT"}, "text": "table", "orig": "table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 53, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.073, "r_y0": 276.5, "r_x1": 217.932, "r_y1": 276.5, "r_x2": 217.932, "r_y2": 267.948, "r_x3": 183.073, "r_y3": 267.948, "coord_origin": "TOPLEFT"}, "text": "structure", "orig": "structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 54, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 222.206, "r_y0": 276.5, "r_x1": 286.365, "r_y1": 276.5, "r_x2": 286.365, "r_y2": 267.948, "r_x3": 222.206, "r_y3": 267.948, "coord_origin": "TOPLEFT"}, "text": "from an image.", "orig": "from an image.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 55, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 288.455, "r_x1": 286.365, "r_y1": 288.455, "r_x2": 286.365, "r_y2": 279.903, "r_x3": 50.112, "r_y3": 279.903, "coord_origin": "TOPLEFT"}, "text": "All the more, our model outperforms pre-trained methods.", "orig": "All the more, our model outperforms pre-trained methods.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 56, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 300.411, "r_x1": 286.365, "r_y1": 300.411, "r_x2": 286.365, "r_y2": 291.859, "r_x3": 50.112, "r_y3": 291.859, "coord_origin": "TOPLEFT"}, "text": "During the evaluation we do not apply any table filtering.", "orig": "During the evaluation we do not apply any table filtering.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 57, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 312.366, "r_x1": 286.365, "r_y1": 312.366, "r_x2": 286.365, "r_y2": 303.814, "r_x3": 50.112, "r_y3": 303.814, "coord_origin": "TOPLEFT"}, "text": "We also provide our baseline results on the SynthTabNet", "orig": "We also provide our baseline results on the SynthTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 58, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 324.321, "r_x1": 80.269, "r_y1": 324.321, "r_x2": 80.269, "r_y2": 315.769, "r_x3": 50.112, "r_y3": 315.769, "coord_origin": "TOPLEFT"}, "text": "dataset.", "orig": "dataset.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 59, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 85.579, "r_y0": 324.321, "r_x1": 91.666, "r_y1": 324.321, "r_x2": 91.666, "r_y2": 315.769, "r_x3": 85.579, "r_y3": 315.769, "coord_origin": "TOPLEFT"}, "text": "It", "orig": "It", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 60, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 94.894, "r_y0": 324.321, "r_x1": 257.812, "r_y1": 324.321, "r_x2": 257.812, "r_y2": 315.769, "r_x3": 94.894, "r_y3": 315.769, "coord_origin": "TOPLEFT"}, "text": "has been observed that large tables (e.g.", "orig": "has been observed that large tables (e.g.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 61, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 263.122, "r_y0": 324.321, "r_x1": 286.365, "r_y1": 324.321, "r_x2": 286.365, "r_y2": 315.769, "r_x3": 263.122, "r_y3": 315.769, "coord_origin": "TOPLEFT"}, "text": "tables", "orig": "tables", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 62, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 336.276, "r_x1": 286.365, "r_y1": 336.276, "r_x2": 286.365, "r_y2": 327.724, "r_x3": 50.112, "r_y3": 327.724, "coord_origin": "TOPLEFT"}, "text": "that occupy half of the page or more) yield poor predictions.", "orig": "that occupy half of the page or more) yield poor predictions.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 63, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 348.231, "r_x1": 286.365, "r_y1": 348.231, "r_x2": 286.365, "r_y2": 339.679, "r_x3": 50.112, "r_y3": 339.679, "coord_origin": "TOPLEFT"}, "text": "We attribute this issue to the image resizing during the pre-", "orig": "We attribute this issue to the image resizing during the pre-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 64, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 360.186, "r_x1": 115.068, "r_y1": 360.186, "r_x2": 115.068, "r_y2": 351.634, "r_x3": 50.112, "r_y3": 351.634, "coord_origin": "TOPLEFT"}, "text": "processing step,", "orig": "processing step,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 65, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 119.203, "r_y0": 360.186, "r_x1": 134.147, "r_y1": 360.186, "r_x2": 134.147, "r_y2": 351.634, "r_x3": 119.203, "r_y3": 351.634, "coord_origin": "TOPLEFT"}, "text": "that", "orig": "that", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 66, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 137.952, "r_y0": 360.186, "r_x1": 286.365, "r_y1": 360.186, "r_x2": 286.365, "r_y2": 351.634, "r_x3": 137.952, "r_y3": 351.634, "coord_origin": "TOPLEFT"}, "text": "produces downsampled images with", "orig": "produces downsampled images with", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 67, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 372.142, "r_x1": 155.357, "r_y1": 372.142, "r_x2": 155.357, "r_y2": 363.59, "r_x3": 50.112, "r_y3": 363.59, "coord_origin": "TOPLEFT"}, "text": "indistinguishable features.", "orig": "indistinguishable features.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 68, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.378, "r_y0": 372.142, "r_x1": 286.365, "r_y1": 372.142, "r_x2": 286.365, "r_y2": 363.59, "r_x3": 160.378, "r_y3": 363.59, "coord_origin": "TOPLEFT"}, "text": "This problem can be addressed", "orig": "This problem can be addressed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 69, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 384.097, "r_x1": 286.365, "r_y1": 384.097, "r_x2": 286.365, "r_y2": 375.545, "r_x3": 50.112, "r_y3": 375.545, "coord_origin": "TOPLEFT"}, "text": "by treating such big tables with a separate model which ac-", "orig": "by treating such big tables with a separate model which ac-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 70, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 396.052, "r_x1": 170.012, "r_y1": 396.052, "r_x2": 170.012, "r_y2": 387.5, "r_x3": 50.112, "r_y3": 387.5, "coord_origin": "TOPLEFT"}, "text": "cepts a large input image size.", "orig": "cepts a large input image size.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 71, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 78.843, "r_y0": 429.511, "r_x1": 104.855, "r_y1": 429.511, "r_x2": 104.855, "r_y2": 420.959, "r_x3": 78.843, "r_y3": 420.959, "coord_origin": "TOPLEFT"}, "text": "Model", "orig": "Model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 72, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 211.2, "r_y0": 423.533, "r_x1": 236.107, "r_y1": 423.533, "r_x2": 236.107, "r_y2": 414.981, "r_x3": 211.2, "r_y3": 414.981, "coord_origin": "TOPLEFT"}, "text": "TEDS", "orig": "TEDS", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 73, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 129.338, "r_y0": 435.488, "r_x1": 159.216, "r_y1": 435.488, "r_x2": 159.216, "r_y2": 426.936, "r_x3": 129.338, "r_y3": 426.936, "coord_origin": "TOPLEFT"}, "text": "Dataset", "orig": "Dataset", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 74, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 171.171, "r_y0": 435.488, "r_x1": 199.405, "r_y1": 435.488, "r_x2": 199.405, "r_y2": 426.936, "r_x3": 171.171, "r_y3": 426.936, "coord_origin": "TOPLEFT"}, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 75, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 211.36, "r_y0": 435.488, "r_x1": 247.744, "r_y1": 435.488, "r_x2": 247.744, "r_y2": 426.936, "r_x3": 211.36, "r_y3": 426.936, "coord_origin": "TOPLEFT"}, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 76, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 264.54, "r_y0": 435.488, "r_x1": 277.273, "r_y1": 435.488, "r_x2": 277.273, "r_y2": 426.936, "r_x3": 264.54, "r_y3": 426.936, "coord_origin": "TOPLEFT"}, "text": "All", "orig": "All", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 77, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 81.612, "r_y0": 452.445, "r_x1": 102.085, "r_y1": 452.445, "r_x2": 102.085, "r_y2": 443.893, "r_x3": 81.612, "r_y3": 443.893, "coord_origin": "TOPLEFT"}, "text": "EDD", "orig": "EDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 78, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.872, "r_y0": 452.445, "r_x1": 153.691, "r_y1": 452.445, "r_x2": 153.691, "r_y2": 443.893, "r_x3": 134.872, "r_y3": 443.893, "coord_origin": "TOPLEFT"}, "text": "PTN", "orig": "PTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 79, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 176.566, "r_y0": 452.445, "r_x1": 194.0, "r_y1": 452.445, "r_x2": 194.0, "r_y2": 443.893, "r_x3": 176.566, "r_y3": 443.893, "coord_origin": "TOPLEFT"}, "text": "91.1", "orig": "91.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 80, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 220.829, "r_y0": 452.445, "r_x1": 238.264, "r_y1": 452.445, "r_x2": 238.264, "r_y2": 443.893, "r_x3": 220.829, "r_y3": 443.893, "coord_origin": "TOPLEFT"}, "text": "88.7", "orig": "88.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 81, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 262.184, "r_y0": 452.445, "r_x1": 279.619, "r_y1": 452.445, "r_x2": 279.619, "r_y2": 443.893, "r_x3": 262.184, "r_y3": 443.893, "coord_origin": "TOPLEFT"}, "text": "89.9", "orig": "89.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 82, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 82.165, "r_y0": 464.401, "r_x1": 101.532, "r_y1": 464.401, "r_x2": 101.532, "r_y2": 455.849, "r_x3": 82.165, "r_y3": 455.849, "coord_origin": "TOPLEFT"}, "text": "GTE", "orig": "GTE", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 83, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.867, "r_y0": 464.401, "r_x1": 153.687, "r_y1": 464.401, "r_x2": 153.687, "r_y2": 455.849, "r_x3": 134.867, "r_y3": 455.849, "coord_origin": "TOPLEFT"}, "text": "PTN", "orig": "PTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 84, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.624, "r_y0": 464.401, "r_x1": 186.942, "r_y1": 464.401, "r_x2": 186.942, "r_y2": 455.849, "r_x3": 183.624, "r_y3": 455.849, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 85, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 227.888, "r_y0": 464.401, "r_x1": 231.205, "r_y1": 464.401, "r_x2": 231.205, "r_y2": 455.849, "r_x3": 227.888, "r_y3": 455.849, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 86, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 259.699, "r_y0": 464.401, "r_x1": 282.114, "r_y1": 464.401, "r_x2": 282.114, "r_y2": 455.849, "r_x3": 259.699, "r_y3": 455.849, "coord_origin": "TOPLEFT"}, "text": "93.01", "orig": "93.01", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 87, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 66.315, "r_y0": 476.954, "r_x1": 117.383, "r_y1": 476.954, "r_x2": 117.383, "r_y2": 468.402, "r_x3": 66.315, "r_y3": 468.402, "coord_origin": "TOPLEFT"}, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 88, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.868, "r_y0": 476.954, "r_x1": 153.687, "r_y1": 476.954, "r_x2": 153.687, "r_y2": 468.402, "r_x3": 134.868, "r_y3": 468.402, "coord_origin": "TOPLEFT"}, "text": "PTN", "orig": "PTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 89, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 176.571, "r_y0": 476.954, "r_x1": 194.006, "r_y1": 476.954, "r_x2": 194.006, "r_y2": 468.402, "r_x3": 176.571, "r_y3": 468.402, "coord_origin": "TOPLEFT"}, "text": "98.5", "orig": "98.5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 90, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 220.835, "r_y0": 476.954, "r_x1": 238.269, "r_y1": 476.954, "r_x2": 238.269, "r_y2": 468.402, "r_x3": 220.835, "r_y3": 468.402, "coord_origin": "TOPLEFT"}, "text": "95.0", "orig": "95.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 91, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 259.698, "r_y0": 476.97, "r_x1": 282.114, "r_y1": 476.97, "r_x2": 282.114, "r_y2": 468.014, "r_x3": 259.698, "r_y3": 468.014, "coord_origin": "TOPLEFT"}, "text": "96.75", "orig": "96.75", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 92, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 81.612, "r_y0": 492.147, "r_x1": 102.085, "r_y1": 492.147, "r_x2": 102.085, "r_y2": 483.595, "r_x3": 81.612, "r_y3": 483.595, "coord_origin": "TOPLEFT"}, "text": "EDD", "orig": "EDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 93, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.872, "r_y0": 492.147, "r_x1": 153.691, "r_y1": 492.147, "r_x2": 153.691, "r_y2": 483.595, "r_x3": 134.872, "r_y3": 483.595, "coord_origin": "TOPLEFT"}, "text": "FTN", "orig": "FTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 94, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 176.566, "r_y0": 492.147, "r_x1": 194.0, "r_y1": 492.147, "r_x2": 194.0, "r_y2": 483.595, "r_x3": 176.566, "r_y3": 483.595, "coord_origin": "TOPLEFT"}, "text": "88.4", "orig": "88.4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 95, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 218.339, "r_y0": 492.147, "r_x1": 240.755, "r_y1": 492.147, "r_x2": 240.755, "r_y2": 483.595, "r_x3": 218.339, "r_y3": 483.595, "coord_origin": "TOPLEFT"}, "text": "92.08", "orig": "92.08", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 96, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 262.184, "r_y0": 492.147, "r_x1": 279.619, "r_y1": 492.147, "r_x2": 279.619, "r_y2": 483.595, "r_x3": 262.184, "r_y3": 483.595, "coord_origin": "TOPLEFT"}, "text": "90.6", "orig": "90.6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 97, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 82.165, "r_y0": 504.102, "r_x1": 101.532, "r_y1": 504.102, "r_x2": 101.532, "r_y2": 495.55, "r_x3": 82.165, "r_y3": 495.55, "coord_origin": "TOPLEFT"}, "text": "GTE", "orig": "GTE", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 98, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.867, "r_y0": 504.102, "r_x1": 153.687, "r_y1": 504.102, "r_x2": 153.687, "r_y2": 495.55, "r_x3": 134.867, "r_y3": 495.55, "coord_origin": "TOPLEFT"}, "text": "FTN", "orig": "FTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 99, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.624, "r_y0": 504.102, "r_x1": 186.942, "r_y1": 504.102, "r_x2": 186.942, "r_y2": 495.55, "r_x3": 183.624, "r_y3": 495.55, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 100, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 227.888, "r_y0": 504.102, "r_x1": 231.205, "r_y1": 504.102, "r_x2": 231.205, "r_y2": 495.55, "r_x3": 227.888, "r_y3": 495.55, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 101, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 259.699, "r_y0": 504.102, "r_x1": 282.114, "r_y1": 504.102, "r_x2": 282.114, "r_y2": 495.55, "r_x3": 259.699, "r_y3": 495.55, "coord_origin": "TOPLEFT"}, "text": "87.14", "orig": "87.14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 102, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 71.789, "r_y0": 516.057, "r_x1": 111.908, "r_y1": 516.057, "r_x2": 111.908, "r_y2": 507.505, "r_x3": 71.789, "r_y3": 507.505, "coord_origin": "TOPLEFT"}, "text": "GTE (FT)", "orig": "GTE (FT)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 103, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.862, "r_y0": 516.057, "r_x1": 153.682, "r_y1": 516.057, "r_x2": 153.682, "r_y2": 507.505, "r_x3": 134.862, "r_y3": 507.505, "coord_origin": "TOPLEFT"}, "text": "FTN", "orig": "FTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 104, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.629, "r_y0": 516.057, "r_x1": 186.947, "r_y1": 516.057, "r_x2": 186.947, "r_y2": 507.505, "r_x3": 183.629, "r_y3": 507.505, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 105, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 227.893, "r_y0": 516.057, "r_x1": 231.211, "r_y1": 516.057, "r_x2": 231.211, "r_y2": 507.505, "r_x3": 227.893, "r_y3": 507.505, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 106, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 259.694, "r_y0": 516.057, "r_x1": 282.109, "r_y1": 516.057, "r_x2": 282.109, "r_y2": 507.505, "r_x3": 259.694, "r_y3": 507.505, "coord_origin": "TOPLEFT"}, "text": "91.02", "orig": "91.02", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 107, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 66.315, "r_y0": 528.012, "r_x1": 117.383, "r_y1": 528.012, "r_x2": 117.383, "r_y2": 519.46, "r_x3": 66.315, "r_y3": 519.46, "coord_origin": "TOPLEFT"}, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 108, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.868, "r_y0": 528.012, "r_x1": 153.687, "r_y1": 528.012, "r_x2": 153.687, "r_y2": 519.46, "r_x3": 134.868, "r_y3": 519.46, "coord_origin": "TOPLEFT"}, "text": "FTN", "orig": "FTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 109, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 176.571, "r_y0": 528.012, "r_x1": 194.006, "r_y1": 528.012, "r_x2": 194.006, "r_y2": 519.46, "r_x3": 176.571, "r_y3": 519.46, "coord_origin": "TOPLEFT"}, "text": "97.5", "orig": "97.5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 110, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 220.835, "r_y0": 528.012, "r_x1": 238.269, "r_y1": 528.012, "r_x2": 238.269, "r_y2": 519.46, "r_x3": 220.835, "r_y3": 519.46, "coord_origin": "TOPLEFT"}, "text": "96.0", "orig": "96.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 111, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 262.189, "r_y0": 528.028, "r_x1": 279.624, "r_y1": 528.028, "r_x2": 279.624, "r_y2": 519.072, "r_x3": 262.189, "r_y3": 519.072, "coord_origin": "TOPLEFT"}, "text": "96.8", "orig": "96.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 112, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 81.612, "r_y0": 545.319, "r_x1": 102.085, "r_y1": 545.319, "r_x2": 102.085, "r_y2": 536.767, "r_x3": 81.612, "r_y3": 536.767, "coord_origin": "TOPLEFT"}, "text": "EDD", "orig": "EDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 113, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 137.911, "r_y0": 545.319, "r_x1": 150.643, "r_y1": 545.319, "r_x2": 150.643, "r_y2": 536.767, "r_x3": 137.911, "r_y3": 536.767, "coord_origin": "TOPLEFT"}, "text": "TB", "orig": "TB", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 114, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 176.566, "r_y0": 545.319, "r_x1": 194.0, "r_y1": 545.319, "r_x2": 194.0, "r_y2": 536.767, "r_x3": 176.566, "r_y3": 536.767, "coord_origin": "TOPLEFT"}, "text": "86.0", "orig": "86.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 115, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 227.893, "r_y0": 545.319, "r_x1": 231.21, "r_y1": 545.319, "r_x2": 231.21, "r_y2": 536.767, "r_x3": 227.893, "r_y3": 536.767, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 116, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 262.184, "r_y0": 545.319, "r_x1": 279.619, "r_y1": 545.319, "r_x2": 279.619, "r_y2": 536.767, "r_x3": 262.184, "r_y3": 536.767, "coord_origin": "TOPLEFT"}, "text": "86.0", "orig": "86.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 117, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 66.315, "r_y0": 557.275, "r_x1": 117.383, "r_y1": 557.275, "r_x2": 117.383, "r_y2": 548.723, "r_x3": 66.315, "r_y3": 548.723, "coord_origin": "TOPLEFT"}, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 118, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 137.906, "r_y0": 557.275, "r_x1": 150.638, "r_y1": 557.275, "r_x2": 150.638, "r_y2": 548.723, "r_x3": 137.906, "r_y3": 548.723, "coord_origin": "TOPLEFT"}, "text": "TB", "orig": "TB", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 119, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 176.571, "r_y0": 557.275, "r_x1": 194.006, "r_y1": 557.275, "r_x2": 194.006, "r_y2": 548.723, "r_x3": 176.571, "r_y3": 548.723, "coord_origin": "TOPLEFT"}, "text": "89.6", "orig": "89.6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 120, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 227.888, "r_y0": 557.275, "r_x1": 231.206, "r_y1": 557.275, "r_x2": 231.206, "r_y2": 548.723, "r_x3": 227.888, "r_y3": 548.723, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 121, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 262.189, "r_y0": 557.2909999999999, "r_x1": 279.624, "r_y1": 557.2909999999999, "r_x2": 279.624, "r_y2": 548.335, "r_x3": 262.189, "r_y3": 548.335, "coord_origin": "TOPLEFT"}, "text": "89.6", "orig": "89.6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 122, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 66.315, "r_y0": 576.823, "r_x1": 117.383, "r_y1": 576.823, "r_x2": 117.383, "r_y2": 568.271, "r_x3": 66.315, "r_y3": 568.271, "coord_origin": "TOPLEFT"}, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 123, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.868, "r_y0": 576.823, "r_x1": 153.687, "r_y1": 576.823, "r_x2": 153.687, "r_y2": 568.271, "r_x3": 134.868, "r_y3": 568.271, "coord_origin": "TOPLEFT"}, "text": "STN", "orig": "STN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 124, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 176.571, "r_y0": 576.823, "r_x1": 194.006, "r_y1": 576.823, "r_x2": 194.006, "r_y2": 568.271, "r_x3": 176.571, "r_y3": 568.271, "coord_origin": "TOPLEFT"}, "text": "96.9", "orig": "96.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 125, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 220.835, "r_y0": 576.823, "r_x1": 238.269, "r_y1": 576.823, "r_x2": 238.269, "r_y2": 568.271, "r_x3": 220.835, "r_y3": 568.271, "coord_origin": "TOPLEFT"}, "text": "95.7", "orig": "95.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 126, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 262.19, "r_y0": 576.823, "r_x1": 279.624, "r_y1": 576.823, "r_x2": 279.624, "r_y2": 568.271, "r_x3": 262.19, "r_y3": 568.271, "coord_origin": "TOPLEFT"}, "text": "96.7", "orig": "96.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 127, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 601.254, "r_x1": 82.062, "r_y1": 601.254, "r_x2": 82.062, "r_y2": 592.702, "r_x3": 50.112, "r_y3": 592.702, "coord_origin": "TOPLEFT"}, "text": "Table 2:", "orig": "Table 2:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 128, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 87.382, "r_y0": 601.254, "r_x1": 286.365, "r_y1": 601.254, "r_x2": 286.365, "r_y2": 592.702, "r_x3": 87.382, "r_y3": 592.702, "coord_origin": "TOPLEFT"}, "text": "Structure results on PubTabNet (PTN), FinTabNet", "orig": "Structure results on PubTabNet (PTN), FinTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 129, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 613.2090000000001, "r_x1": 247.461, "r_y1": 613.2090000000001, "r_x2": 247.461, "r_y2": 604.657, "r_x3": 50.112, "r_y3": 604.657, "coord_origin": "TOPLEFT"}, "text": "(FTN), TableBank (TB) and SynthTabNet (STN).", "orig": "(FTN), TableBank (TB) and SynthTabNet (STN).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 130, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 625.164, "r_x1": 261.787, "r_y1": 625.164, "r_x2": 261.787, "r_y2": 616.612, "r_x3": 50.112, "r_y3": 616.612, "coord_origin": "TOPLEFT"}, "text": "FT: Model was trained on PubTabNet then finetuned.", "orig": "FT: Model was trained on PubTabNet then finetuned.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 131, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 653.306, "r_x1": 124.722, "r_y1": 653.306, "r_x2": 124.722, "r_y2": 644.35, "r_x3": 62.067, "r_y3": 644.35, "coord_origin": "TOPLEFT"}, "text": "Cell Detection.", "orig": "Cell Detection.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 132, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 128.204, "r_y0": 653.29, "r_x1": 242.933, "r_y1": 653.29, "r_x2": 242.933, "r_y2": 644.738, "r_x3": 128.204, "r_y3": 644.738, "coord_origin": "TOPLEFT"}, "text": "Like any object detector, our", "orig": "Like any object detector, our", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 133, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 245.554, "r_y0": 653.1469999999999, "r_x1": 286.361, "r_y1": 653.1469999999999, "r_x2": 286.361, "r_y2": 644.559, "r_x3": 245.554, "r_y3": 644.559, "coord_origin": "TOPLEFT"}, "text": "Cell BBox", "orig": "Cell BBox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 134, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 665.102, "r_x1": 84.971, "r_y1": 665.102, "r_x2": 84.971, "r_y2": 656.514, "r_x3": 50.112, "r_y3": 656.514, "coord_origin": "TOPLEFT"}, "text": "Detector", "orig": "Detector", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 135, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 89.515, "r_y0": 665.245, "r_x1": 123.677, "r_y1": 665.245, "r_x2": 123.677, "r_y2": 656.693, "r_x3": 89.515, "r_y3": 656.693, "coord_origin": "TOPLEFT"}, "text": "provides", "orig": "provides", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 136, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 127.991, "r_y0": 665.245, "r_x1": 286.366, "r_y1": 665.245, "r_x2": 286.366, "r_y2": 656.693, "r_x3": 127.991, "r_y3": 656.693, "coord_origin": "TOPLEFT"}, "text": "bounding boxes that can be improved", "orig": "bounding boxes that can be improved", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 137, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 677.2, "r_x1": 286.365, "r_y1": 677.2, "r_x2": 286.365, "r_y2": 668.648, "r_x3": 50.112, "r_y3": 668.648, "coord_origin": "TOPLEFT"}, "text": "with post-processing during inference. We make use of the", "orig": "with post-processing during inference. We make use of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 138, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 689.156, "r_x1": 259.655, "r_y1": 689.156, "r_x2": 259.655, "r_y2": 680.604, "r_x3": 50.112, "r_y3": 680.604, "coord_origin": "TOPLEFT"}, "text": "grid-like structure of tables to refine the predictions.", "orig": "grid-like structure of tables to refine the predictions.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 139, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 263.65, "r_y0": 689.156, "r_x1": 286.365, "r_y1": 689.156, "r_x2": 286.365, "r_y2": 680.604, "r_x3": 263.65, "r_y3": 680.604, "coord_origin": "TOPLEFT"}, "text": "A de-", "orig": "A de-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 140, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 701.111, "r_x1": 286.365, "r_y1": 701.111, "r_x2": 286.365, "r_y2": 692.559, "r_x3": 50.112, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "tailed explanation on the post-processing is available in the", "orig": "tailed explanation on the post-processing is available in the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 141, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 713.066, "r_x1": 147.068, "r_y1": 713.066, "r_x2": 147.068, "r_y2": 704.514, "r_x3": 50.112, "r_y3": 704.514, "coord_origin": "TOPLEFT"}, "text": "supplementary material.", "orig": "supplementary material.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 142, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 152.159, "r_y0": 713.066, "r_x1": 223.003, "r_y1": 713.066, "r_x2": 223.003, "r_y2": 704.514, "r_x3": 152.159, "r_y3": 704.514, "coord_origin": "TOPLEFT"}, "text": "As shown in Tab.", "orig": "As shown in Tab.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 143, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 228.094, "r_y0": 713.066, "r_x1": 286.365, "r_y1": 713.066, "r_x2": 286.365, "r_y2": 704.514, "r_x3": 228.094, "r_y3": 704.514, "coord_origin": "TOPLEFT"}, "text": "3, we evaluate", "orig": "3, we evaluate", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 144, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 84.029, "r_x1": 322.142, "r_y1": 84.029, "r_x2": 322.142, "r_y2": 75.47699999999998, "r_x3": 308.862, "r_y3": 75.47699999999998, "coord_origin": "TOPLEFT"}, "text": "our", "orig": "our", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 145, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 325.454, "r_y0": 83.88599999999997, "r_x1": 404.567, "r_y1": 83.88599999999997, "r_x2": 404.567, "r_y2": 75.298, "r_x3": 325.454, "r_y3": 75.298, "coord_origin": "TOPLEFT"}, "text": "Cell BBox Decoder", "orig": "Cell BBox Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 146, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 408.104, "r_y0": 84.029, "r_x1": 545.11, "r_y1": 84.029, "r_x2": 545.11, "r_y2": 75.47699999999998, "r_x3": 408.104, "r_y3": 75.47699999999998, "coord_origin": "TOPLEFT"}, "text": "accuracy for cells with a class la-", "orig": "accuracy for cells with a class la-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 147, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 95.98400000000004, "r_x1": 545.115, "r_y1": 95.98400000000004, "r_x2": 545.115, "r_y2": 87.43200000000002, "r_x3": 308.862, "r_y3": 87.43200000000002, "coord_origin": "TOPLEFT"}, "text": "bel of 'content' only using the PASCAL VOC mAP metric", "orig": "bel of 'content' only using the PASCAL VOC mAP metric", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 148, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 107.93899999999996, "r_x1": 320.478, "r_y1": 107.93899999999996, "r_x2": 320.478, "r_y2": 99.38699999999994, "r_x3": 308.862, "r_y3": 99.38699999999994, "coord_origin": "TOPLEFT"}, "text": "for", "orig": "for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 149, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 324.374, "r_y0": 107.93899999999996, "r_x1": 470.226, "r_y1": 107.93899999999996, "r_x2": 470.226, "r_y2": 99.38699999999994, "r_x3": 324.374, "r_y3": 99.38699999999994, "coord_origin": "TOPLEFT"}, "text": "pre-processing and post-processing.", "orig": "pre-processing and post-processing.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 150, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 477.529, "r_y0": 107.93899999999996, "r_x1": 545.115, "r_y1": 107.93899999999996, "r_x2": 545.115, "r_y2": 99.38699999999994, "r_x3": 477.529, "r_y3": 99.38699999999994, "coord_origin": "TOPLEFT"}, "text": "Note that we do", "orig": "Note that we do", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 151, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 119.894, "r_x1": 545.115, "r_y1": 119.894, "r_x2": 545.115, "r_y2": 111.34199999999998, "r_x3": 308.862, "r_y3": 111.34199999999998, "coord_origin": "TOPLEFT"}, "text": "not have post-processing results for SynthTabNet as images", "orig": "not have post-processing results for SynthTabNet as images", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 152, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 131.84900000000005, "r_x1": 545.115, "r_y1": 131.84900000000005, "r_x2": 545.115, "r_y2": 123.29700000000003, "r_x3": 308.862, "r_y3": 123.29700000000003, "coord_origin": "TOPLEFT"}, "text": "are only provided. To compare the performance of our pro-", "orig": "are only provided. To compare the performance of our pro-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 153, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 143.80499999999995, "r_x1": 502.017, "r_y1": 143.80499999999995, "r_x2": 502.017, "r_y2": 135.25300000000004, "r_x3": 308.862, "r_y3": 135.25300000000004, "coord_origin": "TOPLEFT"}, "text": "posed approach, we've integrated TableFormer's", "orig": "posed approach, we've integrated TableFormer's", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 154, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 504.473, "r_y0": 143.66200000000003, "r_x1": 545.11, "r_y1": 143.66200000000003, "r_x2": 545.11, "r_y2": 135.07399999999996, "r_x3": 504.473, "r_y3": 135.07399999999996, "coord_origin": "TOPLEFT"}, "text": "Cell BBox", "orig": "Cell BBox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 155, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 155.61699999999996, "r_x1": 343.163, "r_y1": 155.61699999999996, "r_x2": 343.163, "r_y2": 147.029, "r_x3": 308.862, "r_y3": 147.029, "coord_origin": "TOPLEFT"}, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 156, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 346.371, "r_y0": 155.76, "r_x1": 437.818, "r_y1": 155.76, "r_x2": 437.818, "r_y2": 147.20799999999997, "r_x3": 346.371, "r_y3": 147.20799999999997, "coord_origin": "TOPLEFT"}, "text": "into EDD architecture.", "orig": "into EDD architecture.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 157, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 442.371, "r_y0": 155.76, "r_x1": 545.115, "r_y1": 155.76, "r_x2": 545.115, "r_y2": 147.20799999999997, "r_x3": 442.371, "r_y3": 147.20799999999997, "coord_origin": "TOPLEFT"}, "text": "As mentioned previously,", "orig": "As mentioned previously,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 158, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 167.71500000000003, "r_x1": 446.157, "r_y1": 167.71500000000003, "r_x2": 446.157, "r_y2": 159.163, "r_x3": 308.862, "r_y3": 159.163, "coord_origin": "TOPLEFT"}, "text": "the Structure Decoder provides the", "orig": "the Structure Decoder provides the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 159, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 448.29, "r_y0": 167.572, "r_x1": 525.042, "r_y1": 167.572, "r_x2": 525.042, "r_y2": 158.98400000000004, "r_x3": 448.29, "r_y3": 158.98400000000004, "coord_origin": "TOPLEFT"}, "text": "Cell BBox Decoder", "orig": "Cell BBox Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 160, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 527.399, "r_y0": 167.71500000000003, "r_x1": 545.113, "r_y1": 167.71500000000003, "r_x2": 545.113, "r_y2": 159.163, "r_x3": 527.399, "r_y3": 159.163, "coord_origin": "TOPLEFT"}, "text": "with", "orig": "with", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 161, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 179.66999999999996, "r_x1": 545.115, "r_y1": 179.66999999999996, "r_x2": 545.115, "r_y2": 171.11800000000005, "r_x3": 308.862, "r_y3": 171.11800000000005, "coord_origin": "TOPLEFT"}, "text": "the features needed to predict the bounding box predictions.", "orig": "the features needed to predict the bounding box predictions.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 162, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 191.625, "r_x1": 432.866, "r_y1": 191.625, "r_x2": 432.866, "r_y2": 183.07299999999998, "r_x3": 308.862, "r_y3": 183.07299999999998, "coord_origin": "TOPLEFT"}, "text": "Therefore, the accuracy of the", "orig": "Therefore, the accuracy of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 163, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 436.39, "r_y0": 191.48199999999997, "r_x1": 510.93, "r_y1": 191.48199999999997, "r_x2": 510.93, "r_y2": 182.894, "r_x3": 436.39, "r_y3": 182.894, "coord_origin": "TOPLEFT"}, "text": "Structure Decoder", "orig": "Structure Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 164, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 514.677, "r_y0": 191.625, "r_x1": 545.113, "r_y1": 191.625, "r_x2": 545.113, "r_y2": 183.07299999999998, "r_x3": 514.677, "r_y3": 183.07299999999998, "coord_origin": "TOPLEFT"}, "text": "directly", "orig": "directly", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 165, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 203.58000000000004, "r_x1": 431.173, "r_y1": 203.58000000000004, "r_x2": 431.173, "r_y2": 195.02800000000002, "r_x3": 308.862, "r_y3": 195.02800000000002, "coord_origin": "TOPLEFT"}, "text": "influences the accuracy of the", "orig": "influences the accuracy of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 166, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 434.679, "r_y0": 203.437, "r_x1": 514.181, "r_y1": 203.437, "r_x2": 514.181, "r_y2": 194.84900000000005, "r_x3": 434.679, "r_y3": 194.84900000000005, "coord_origin": "TOPLEFT"}, "text": "Cell BBox Decoder", "orig": "Cell BBox Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 167, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 514.176, "r_y0": 203.58000000000004, "r_x1": 516.667, "r_y1": 203.58000000000004, "r_x2": 516.667, "r_y2": 195.02800000000002, "r_x3": 514.176, "r_y3": 195.02800000000002, "coord_origin": "TOPLEFT"}, "text": ".", "orig": ".", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 168, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 522.794, "r_y0": 203.58000000000004, "r_x1": 529.429, "r_y1": 203.58000000000004, "r_x2": 529.429, "r_y2": 195.02800000000002, "r_x3": 522.794, "r_y3": 195.02800000000002, "coord_origin": "TOPLEFT"}, "text": "If", "orig": "If", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 169, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 532.936, "r_y0": 203.58000000000004, "r_x1": 545.11, "r_y1": 203.58000000000004, "r_x2": 545.11, "r_y2": 195.02800000000002, "r_x3": 532.936, "r_y3": 195.02800000000002, "coord_origin": "TOPLEFT"}, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 170, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 215.39300000000003, "r_x1": 382.356, "r_y1": 215.39300000000003, "r_x2": 382.356, "r_y2": 206.80499999999995, "r_x3": 308.862, "r_y3": 206.80499999999995, "coord_origin": "TOPLEFT"}, "text": "Structure Decoder", "orig": "Structure Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 171, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 385.075, "r_y0": 215.53599999999994, "r_x1": 545.114, "r_y1": 215.53599999999994, "r_x2": 545.114, "r_y2": 206.98400000000004, "r_x3": 385.075, "r_y3": 206.98400000000004, "coord_origin": "TOPLEFT"}, "text": "predicts an extra column, this will result", "orig": "predicts an extra column, this will result", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 172, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 227.49099999999999, "r_x1": 501.698, "r_y1": 227.49099999999999, "r_x2": 501.698, "r_y2": 218.93899999999996, "r_x3": 308.862, "r_y3": 218.93899999999996, "coord_origin": "TOPLEFT"}, "text": "in an extra column of predicted bounding boxes.", "orig": "in an extra column of predicted bounding boxes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 173, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 339.323, "r_y0": 262.485, "r_x1": 365.335, "r_y1": 262.485, "r_x2": 365.335, "r_y2": 253.933, "r_x3": 339.323, "r_y3": 253.933, "coord_origin": "TOPLEFT"}, "text": "Model", "orig": "Model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 174, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 401.041, "r_y0": 262.485, "r_x1": 430.919, "r_y1": 262.485, "r_x2": 430.919, "r_y2": 253.933, "r_x3": 401.041, "r_y3": 253.933, "coord_origin": "TOPLEFT"}, "text": "Dataset", "orig": "Dataset", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 175, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 454.102, "r_y0": 262.485, "r_x1": 474.585, "r_y1": 262.485, "r_x2": 474.585, "r_y2": 253.933, "r_x3": 454.102, "r_y3": 253.933, "coord_origin": "TOPLEFT"}, "text": "mAP", "orig": "mAP", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 176, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 486.54, "r_y0": 262.485, "r_x1": 527.228, "r_y1": 262.485, "r_x2": 527.228, "r_y2": 253.933, "r_x3": 486.54, "r_y3": 253.933, "coord_origin": "TOPLEFT"}, "text": "mAP (PP)", "orig": "mAP (PP)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 177, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 327.656, "r_y0": 279.442, "r_x1": 377.001, "r_y1": 279.442, "r_x2": 377.001, "r_y2": 270.89, "r_x3": 327.656, "r_y3": 270.89, "coord_origin": "TOPLEFT"}, "text": "EDD+BBox", "orig": "EDD+BBox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 178, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 393.698, "r_y0": 279.442, "r_x1": 438.281, "r_y1": 279.442, "r_x2": 438.281, "r_y2": 270.89, "r_x3": 393.698, "r_y3": 270.89, "coord_origin": "TOPLEFT"}, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 179, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 455.636, "r_y0": 279.442, "r_x1": 473.07, "r_y1": 279.442, "r_x2": 473.07, "r_y2": 270.89, "r_x3": 455.636, "r_y3": 270.89, "coord_origin": "TOPLEFT"}, "text": "79.2", "orig": "79.2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 180, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 498.166, "r_y0": 279.442, "r_x1": 515.6, "r_y1": 279.442, "r_x2": 515.6, "r_y2": 270.89, "r_x3": 498.166, "r_y3": 270.89, "coord_origin": "TOPLEFT"}, "text": "82.7", "orig": "82.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 181, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 326.795, "r_y0": 291.397, "r_x1": 377.863, "r_y1": 291.397, "r_x2": 377.863, "r_y2": 282.845, "r_x3": 326.795, "r_y3": 282.845, "coord_origin": "TOPLEFT"}, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 182, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 393.694, "r_y0": 291.397, "r_x1": 438.276, "r_y1": 291.397, "r_x2": 438.276, "r_y2": 282.845, "r_x3": 393.694, "r_y3": 282.845, "coord_origin": "TOPLEFT"}, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 183, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 455.631, "r_y0": 291.413, "r_x1": 473.066, "r_y1": 291.413, "r_x2": 473.066, "r_y2": 282.457, "r_x3": 455.631, "r_y3": 282.457, "coord_origin": "TOPLEFT"}, "text": "82.1", "orig": "82.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 184, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 498.171, "r_y0": 291.413, "r_x1": 515.606, "r_y1": 291.413, "r_x2": 515.606, "r_y2": 282.457, "r_x3": 498.171, "r_y3": 282.457, "coord_origin": "TOPLEFT"}, "text": "86.8", "orig": "86.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 185, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 326.795, "r_y0": 303.352, "r_x1": 377.863, "r_y1": 303.352, "r_x2": 377.863, "r_y2": 294.8, "r_x3": 326.795, "r_y3": 294.8, "coord_origin": "TOPLEFT"}, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 186, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 389.818, "r_y0": 303.352, "r_x1": 442.152, "r_y1": 303.352, "r_x2": 442.152, "r_y2": 294.8, "r_x3": 389.818, "r_y3": 294.8, "coord_origin": "TOPLEFT"}, "text": "SynthTabNet", "orig": "SynthTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 187, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 455.631, "r_y0": 303.352, "r_x1": 473.066, "r_y1": 303.352, "r_x2": 473.066, "r_y2": 294.8, "r_x3": 455.631, "r_y3": 294.8, "coord_origin": "TOPLEFT"}, "text": "87.7", "orig": "87.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 188, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 505.225, "r_y0": 303.352, "r_x1": 508.543, "r_y1": 303.352, "r_x2": 508.543, "r_y2": 294.8, "r_x3": 505.225, "r_y3": 294.8, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 189, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 325.27, "r_x1": 341.499, "r_y1": 325.27, "r_x2": 341.499, "r_y2": 316.718, "r_x3": 308.862, "r_y3": 316.718, "coord_origin": "TOPLEFT"}, "text": "Table 3:", "orig": "Table 3:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 190, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 348.603, "r_y0": 325.27, "r_x1": 545.115, "r_y1": 325.27, "r_x2": 545.115, "r_y2": 316.718, "r_x3": 348.603, "r_y3": 316.718, "coord_origin": "TOPLEFT"}, "text": "Cell Bounding Box detection results on PubTab-", "orig": "Cell Bounding Box detection results on PubTab-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 191, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 337.225, "r_x1": 474.978, "r_y1": 337.225, "r_x2": 474.978, "r_y2": 328.673, "r_x3": 308.862, "r_y3": 328.673, "coord_origin": "TOPLEFT"}, "text": "Net, and FinTabNet. PP: Post-processing.", "orig": "Net, and FinTabNet. PP: Post-processing.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 192, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 376.636, "r_x1": 378.949, "r_y1": 376.636, "r_x2": 378.949, "r_y2": 367.68, "r_x3": 320.817, "r_y3": 367.68, "coord_origin": "TOPLEFT"}, "text": "Cell Content.", "orig": "Cell Content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 193, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 387.079, "r_y0": 376.62, "r_x1": 395.378, "r_y1": 376.62, "r_x2": 395.378, "r_y2": 368.068, "r_x3": 387.079, "r_y3": 368.068, "coord_origin": "TOPLEFT"}, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 194, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 399.552, "r_y0": 376.62, "r_x1": 413.948, "r_y1": 376.62, "r_x2": 413.948, "r_y2": 368.068, "r_x3": 399.552, "r_y3": 368.068, "coord_origin": "TOPLEFT"}, "text": "this", "orig": "this", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 195, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 418.112, "r_y0": 376.62, "r_x1": 448.827, "r_y1": 376.62, "r_x2": 448.827, "r_y2": 368.068, "r_x3": 418.112, "r_y3": 368.068, "coord_origin": "TOPLEFT"}, "text": "section,", "orig": "section,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 196, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 453.42, "r_y0": 376.62, "r_x1": 545.116, "r_y1": 376.62, "r_x2": 545.116, "r_y2": 368.068, "r_x3": 453.42, "r_y3": 368.068, "coord_origin": "TOPLEFT"}, "text": "we evaluate the entire", "orig": "we evaluate the entire", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 197, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 388.575, "r_x1": 487.193, "r_y1": 388.575, "r_x2": 487.193, "r_y2": 380.023, "r_x3": 308.862, "r_y3": 380.023, "coord_origin": "TOPLEFT"}, "text": "pipeline of recovering a table with content.", "orig": "pipeline of recovering a table with content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 198, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 493.967, "r_y0": 388.575, "r_x1": 545.115, "r_y1": 388.575, "r_x2": 545.115, "r_y2": 380.023, "r_x3": 493.967, "r_y3": 380.023, "coord_origin": "TOPLEFT"}, "text": "Here we put", "orig": "Here we put", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 199, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 400.53, "r_x1": 545.115, "r_y1": 400.53, "r_x2": 545.115, "r_y2": 391.978, "r_x3": 308.862, "r_y3": 391.978, "coord_origin": "TOPLEFT"}, "text": "our approach to test by capitalizing on extracting content", "orig": "our approach to test by capitalizing on extracting content", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 200, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 412.486, "r_x1": 545.115, "r_y1": 412.486, "r_x2": 545.115, "r_y2": 403.934, "r_x3": 308.862, "r_y3": 403.934, "coord_origin": "TOPLEFT"}, "text": "from the PDF cells rather than decoding from images. Tab.", "orig": "from the PDF cells rather than decoding from images. Tab.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 201, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 424.441, "r_x1": 545.115, "r_y1": 424.441, "r_x2": 545.115, "r_y2": 415.889, "r_x3": 308.862, "r_y3": 415.889, "coord_origin": "TOPLEFT"}, "text": "4 shows the TEDs score of HTML code representing the", "orig": "4 shows the TEDs score of HTML code representing the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 202, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 436.396, "r_x1": 545.115, "r_y1": 436.396, "r_x2": 545.115, "r_y2": 427.844, "r_x3": 308.862, "r_y3": 427.844, "coord_origin": "TOPLEFT"}, "text": "structure of the table along with the content inserted in the", "orig": "structure of the table along with the content inserted in the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 203, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 448.351, "r_x1": 545.115, "r_y1": 448.351, "r_x2": 545.115, "r_y2": 439.799, "r_x3": 308.862, "r_y3": 439.799, "coord_origin": "TOPLEFT"}, "text": "data cell and compared with the ground-truth. Our method", "orig": "data cell and compared with the ground-truth. Our method", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 204, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 460.306, "r_x1": 350.237, "r_y1": 460.306, "r_x2": 350.237, "r_y2": 451.754, "r_x3": 308.862, "r_y3": 451.754, "coord_origin": "TOPLEFT"}, "text": "achieved a", "orig": "achieved a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 205, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 352.176, "r_y0": 460.322, "r_x1": 374.592, "r_y1": 460.322, "r_x2": 374.592, "r_y2": 451.366, "r_x3": 352.176, "r_y3": 451.366, "coord_origin": "TOPLEFT"}, "text": "5.3%", "orig": "5.3%", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 206, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 376.533, "r_y0": 460.306, "r_x1": 545.11, "r_y1": 460.306, "r_x2": 545.11, "r_y2": 451.754, "r_x3": 376.533, "r_y3": 451.754, "coord_origin": "TOPLEFT"}, "text": "increase over the state-of-the-art, and com-", "orig": "increase over the state-of-the-art, and com-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 207, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 472.261, "r_x1": 380.523, "r_y1": 472.261, "r_x2": 380.523, "r_y2": 463.709, "r_x3": 308.862, "r_y3": 463.709, "coord_origin": "TOPLEFT"}, "text": "mercial solutions.", "orig": "mercial solutions.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 208, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 386.042, "r_y0": 472.261, "r_x1": 545.115, "r_y1": 472.261, "r_x2": 545.115, "r_y2": 463.709, "r_x3": 386.042, "r_y3": 463.709, "coord_origin": "TOPLEFT"}, "text": "We believe our scores would be higher", "orig": "We believe our scores would be higher", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 209, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 484.217, "r_x1": 314.949, "r_y1": 484.217, "r_x2": 314.949, "r_y2": 475.665, "r_x3": 308.862, "r_y3": 475.665, "coord_origin": "TOPLEFT"}, "text": "if", "orig": "if", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 210, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 318.008, "r_y0": 484.217, "r_x1": 545.115, "r_y1": 484.217, "r_x2": 545.115, "r_y2": 475.665, "r_x3": 318.008, "r_y3": 475.665, "coord_origin": "TOPLEFT"}, "text": "the HTML ground-truth matched the extracted PDF cell", "orig": "the HTML ground-truth matched the extracted PDF cell", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 211, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 496.172, "r_x1": 340.683, "r_y1": 496.172, "r_x2": 340.683, "r_y2": 487.62, "r_x3": 308.862, "r_y3": 487.62, "coord_origin": "TOPLEFT"}, "text": "content.", "orig": "content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 212, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 345.793, "r_y0": 496.172, "r_x1": 545.115, "r_y1": 496.172, "r_x2": 545.115, "r_y2": 487.62, "r_x3": 345.793, "r_y3": 487.62, "coord_origin": "TOPLEFT"}, "text": "Unfortunately, there are small discrepancies such", "orig": "Unfortunately, there are small discrepancies such", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 213, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 508.127, "r_x1": 545.115, "r_y1": 508.127, "r_x2": 545.115, "r_y2": 499.575, "r_x3": 308.862, "r_y3": 499.575, "coord_origin": "TOPLEFT"}, "text": "as spacings around words or special characters with various", "orig": "as spacings around words or special characters with various", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 214, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 520.082, "r_x1": 405.698, "r_y1": 520.082, "r_x2": 405.698, "r_y2": 511.53, "r_x3": 308.862, "r_y3": 511.53, "coord_origin": "TOPLEFT"}, "text": "unicode representations.", "orig": "unicode representations.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 215, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 358.011, "r_y0": 561.054, "r_x1": 384.023, "r_y1": 561.054, "r_x2": 384.023, "r_y2": 552.502, "r_x3": 358.011, "r_y3": 552.502, "coord_origin": "TOPLEFT"}, "text": "Model", "orig": "Model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 216, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 449.034, "r_y0": 555.076, "r_x1": 473.94, "r_y1": 555.076, "r_x2": 473.94, "r_y2": 546.524, "r_x3": 449.034, "r_y3": 546.524, "coord_origin": "TOPLEFT"}, "text": "TEDS", "orig": "TEDS", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 217, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 408.506, "r_y0": 567.031, "r_x1": 436.74, "r_y1": 567.031, "r_x2": 436.74, "r_y2": 558.479, "r_x3": 408.506, "r_y3": 558.479, "coord_origin": "TOPLEFT"}, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 218, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 448.695, "r_y0": 567.031, "r_x1": 485.079, "r_y1": 567.031, "r_x2": 485.079, "r_y2": 558.479, "r_x3": 448.695, "r_y3": 558.479, "coord_origin": "TOPLEFT"}, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 219, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 499.385, "r_y0": 567.031, "r_x1": 512.117, "r_y1": 567.031, "r_x2": 512.117, "r_y2": 558.479, "r_x3": 499.385, "r_y3": 558.479, "coord_origin": "TOPLEFT"}, "text": "All", "orig": "All", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 220, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 357.682, "r_y0": 583.988, "r_x1": 384.352, "r_y1": 583.988, "r_x2": 384.352, "r_y2": 575.436, "r_x3": 357.682, "r_y3": 575.436, "coord_origin": "TOPLEFT"}, "text": "Tabula", "orig": "Tabula", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 221, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 413.901, "r_y0": 583.988, "r_x1": 431.336, "r_y1": 583.988, "r_x2": 431.336, "r_y2": 575.436, "r_x3": 413.901, "r_y3": 575.436, "coord_origin": "TOPLEFT"}, "text": "78.0", "orig": "78.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 222, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 458.165, "r_y0": 583.988, "r_x1": 475.599, "r_y1": 583.988, "r_x2": 475.599, "r_y2": 575.436, "r_x3": 458.165, "r_y3": 575.436, "coord_origin": "TOPLEFT"}, "text": "57.8", "orig": "57.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 223, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 497.029, "r_y0": 583.988, "r_x1": 514.463, "r_y1": 583.988, "r_x2": 514.463, "r_y2": 575.436, "r_x3": 497.029, "r_y3": 575.436, "coord_origin": "TOPLEFT"}, "text": "67.9", "orig": "67.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 224, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 350.723, "r_y0": 595.943, "r_x1": 391.311, "r_y1": 595.943, "r_x2": 391.311, "r_y2": 587.391, "r_x3": 350.723, "r_y3": 587.391, "coord_origin": "TOPLEFT"}, "text": "Traprange", "orig": "Traprange", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 225, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 413.906, "r_y0": 595.943, "r_x1": 431.34, "r_y1": 595.943, "r_x2": 431.34, "r_y2": 587.391, "r_x3": 413.906, "r_y3": 587.391, "coord_origin": "TOPLEFT"}, "text": "60.8", "orig": "60.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 226, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 458.17, "r_y0": 595.943, "r_x1": 475.604, "r_y1": 595.943, "r_x2": 475.604, "r_y2": 587.391, "r_x3": 458.17, "r_y3": 587.391, "coord_origin": "TOPLEFT"}, "text": "49.9", "orig": "49.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 227, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 497.034, "r_y0": 595.943, "r_x1": 514.468, "r_y1": 595.943, "r_x2": 514.468, "r_y2": 587.391, "r_x3": 497.034, "r_y3": 587.391, "coord_origin": "TOPLEFT"}, "text": "55.4", "orig": "55.4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 228, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 354.136, "r_y0": 607.899, "r_x1": 387.899, "r_y1": 607.899, "r_x2": 387.899, "r_y2": 599.347, "r_x3": 354.136, "r_y3": 599.347, "coord_origin": "TOPLEFT"}, "text": "Camelot", "orig": "Camelot", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 229, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 413.902, "r_y0": 607.899, "r_x1": 431.336, "r_y1": 607.899, "r_x2": 431.336, "r_y2": 599.347, "r_x3": 413.902, "r_y3": 599.347, "coord_origin": "TOPLEFT"}, "text": "80.0", "orig": "80.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 230, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 458.165, "r_y0": 607.899, "r_x1": 475.6, "r_y1": 607.899, "r_x2": 475.6, "r_y2": 599.347, "r_x3": 458.165, "r_y3": 599.347, "coord_origin": "TOPLEFT"}, "text": "66.0", "orig": "66.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 231, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 497.03, "r_y0": 607.899, "r_x1": 514.464, "r_y1": 607.899, "r_x2": 514.464, "r_y2": 599.347, "r_x3": 497.03, "r_y3": 599.347, "coord_origin": "TOPLEFT"}, "text": "73.0", "orig": "73.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 232, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 346.559, "r_y0": 619.854, "r_x1": 395.475, "r_y1": 619.854, "r_x2": 395.475, "r_y2": 611.302, "r_x3": 346.559, "r_y3": 611.302, "coord_origin": "TOPLEFT"}, "text": "Acrobat Pro", "orig": "Acrobat Pro", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 233, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 413.906, "r_y0": 619.854, "r_x1": 431.341, "r_y1": 619.854, "r_x2": 431.341, "r_y2": 611.302, "r_x3": 413.906, "r_y3": 611.302, "coord_origin": "TOPLEFT"}, "text": "68.9", "orig": "68.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 234, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 458.17, "r_y0": 619.854, "r_x1": 475.605, "r_y1": 619.854, "r_x2": 475.605, "r_y2": 611.302, "r_x3": 458.17, "r_y3": 611.302, "coord_origin": "TOPLEFT"}, "text": "61.8", "orig": "61.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 235, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 497.034, "r_y0": 619.854, "r_x1": 514.469, "r_y1": 619.854, "r_x2": 514.469, "r_y2": 611.302, "r_x3": 497.034, "r_y3": 611.302, "coord_origin": "TOPLEFT"}, "text": "65.3", "orig": "65.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 236, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 360.781, "r_y0": 631.809, "r_x1": 381.254, "r_y1": 631.809, "r_x2": 381.254, "r_y2": 623.2570000000001, "r_x3": 360.781, "r_y3": 623.2570000000001, "coord_origin": "TOPLEFT"}, "text": "EDD", "orig": "EDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 237, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 413.902, "r_y0": 631.809, "r_x1": 431.336, "r_y1": 631.809, "r_x2": 431.336, "r_y2": 623.2570000000001, "r_x3": 413.902, "r_y3": 623.2570000000001, "coord_origin": "TOPLEFT"}, "text": "91.2", "orig": "91.2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 238, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 458.165, "r_y0": 631.809, "r_x1": 475.6, "r_y1": 631.809, "r_x2": 475.6, "r_y2": 623.2570000000001, "r_x3": 458.165, "r_y3": 623.2570000000001, "coord_origin": "TOPLEFT"}, "text": "85.4", "orig": "85.4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 239, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 497.03, "r_y0": 631.809, "r_x1": 514.464, "r_y1": 631.809, "r_x2": 514.464, "r_y2": 623.2570000000001, "r_x3": 497.03, "r_y3": 623.2570000000001, "coord_origin": "TOPLEFT"}, "text": "88.3", "orig": "88.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 240, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 345.483, "r_y0": 643.764, "r_x1": 396.551, "r_y1": 643.764, "r_x2": 396.551, "r_y2": 635.212, "r_x3": 345.483, "r_y3": 635.212, "coord_origin": "TOPLEFT"}, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 241, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 413.906, "r_y0": 643.764, "r_x1": 431.341, "r_y1": 643.764, "r_x2": 431.341, "r_y2": 635.212, "r_x3": 413.906, "r_y3": 635.212, "coord_origin": "TOPLEFT"}, "text": "95.4", "orig": "95.4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 242, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 458.17, "r_y0": 643.764, "r_x1": 475.605, "r_y1": 643.764, "r_x2": 475.605, "r_y2": 635.212, "r_x3": 458.17, "r_y3": 635.212, "coord_origin": "TOPLEFT"}, "text": "90.1", "orig": "90.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 243, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 497.034, "r_y0": 643.78, "r_x1": 514.469, "r_y1": 643.78, "r_x2": 514.469, "r_y2": 634.8240000000001, "r_x3": 497.034, "r_y3": 634.8240000000001, "coord_origin": "TOPLEFT"}, "text": "93.6", "orig": "93.6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 244, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 665.682, "r_x1": 341.739, "r_y1": 665.682, "r_x2": 341.739, "r_y2": 657.13, "r_x3": 308.862, "r_y3": 657.13, "coord_origin": "TOPLEFT"}, "text": "Table 4:", "orig": "Table 4:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 245, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 349.559, "r_y0": 665.682, "r_x1": 545.115, "r_y1": 665.682, "r_x2": 545.115, "r_y2": 657.13, "r_x3": 349.559, "r_y3": 657.13, "coord_origin": "TOPLEFT"}, "text": "Results of structure with content retrieved using", "orig": "Results of structure with content retrieved using", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 246, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 677.637, "r_x1": 425.763, "r_y1": 677.637, "r_x2": 425.763, "r_y2": 669.085, "r_x3": 308.862, "r_y3": 669.085, "coord_origin": "TOPLEFT"}, "text": "cell detection on PubTabNet.", "orig": "cell detection on PubTabNet.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 247, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 430.336, "r_y0": 677.637, "r_x1": 545.115, "r_y1": 677.637, "r_x2": 545.115, "r_y2": 669.085, "r_x3": 430.336, "r_y3": 669.085, "coord_origin": "TOPLEFT"}, "text": "In all cases the input is PDF", "orig": "In all cases the input is PDF", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 248, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 689.592, "r_x1": 435.038, "r_y1": 689.592, "r_x2": 435.038, "r_y2": 681.04, "r_x3": 308.862, "r_y3": 681.04, "coord_origin": "TOPLEFT"}, "text": "documents with cropped tables.", "orig": "documents with cropped tables.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 249, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 295.121, "r_y0": 742.954, "r_x1": 300.102, "r_y1": 742.954, "r_x2": 300.102, "r_y2": 734.402, "r_x3": 295.121, "r_y3": 734.402, "coord_origin": "TOPLEFT"}, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "parsed_page": null, "predictions": {"layout": {"clusters": [{"id": 10, "label": "section_header", "bbox": {"l": 50.112, "t": 74.40099999999995, "r": 167.898, "b": 84.25300000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.9554274082183838, "cells": [{"index": 0, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 84.25300000000004, "r_x1": 167.898, "r_y1": 84.25300000000004, "r_x2": 167.898, "r_y2": 74.40099999999995, "r_x3": 50.112, "r_y3": 74.40099999999995, "coord_origin": "TOPLEFT"}, "text": "5.3. Datasets and Metrics", "orig": "5.3. Datasets and Metrics", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 1, "label": "text", "bbox": {"l": 50.112, "t": 93.61900000000003, "r": 286.365, "b": 138.03700000000003, "coord_origin": "TOPLEFT"}, "confidence": 0.9862998127937317, "cells": [{"index": 1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 102.17100000000005, "r_x1": 286.365, "r_y1": 102.17100000000005, "r_x2": 286.365, "r_y2": 93.61900000000003, "r_x3": 62.067, "r_y3": 93.61900000000003, "coord_origin": "TOPLEFT"}, "text": "The Tree-Edit-Distance-Based Similarity (TEDS) met-", "orig": "The Tree-Edit-Distance-Based Similarity (TEDS) met-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 114.12599999999998, "r_x1": 286.365, "r_y1": 114.12599999999998, "r_x2": 286.365, "r_y2": 105.57399999999996, "r_x3": 50.112, "r_y3": 105.57399999999996, "coord_origin": "TOPLEFT"}, "text": "ric was introduced in [37]. It represents the prediction, and", "orig": "ric was introduced in [37]. It represents the prediction, and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 126.08100000000002, "r_x1": 239.999, "r_y1": 126.08100000000002, "r_x2": 239.999, "r_y2": 117.529, "r_x3": 50.112, "r_y3": 117.529, "coord_origin": "TOPLEFT"}, "text": "ground-truth as a tree structure of HTML tags.", "orig": "ground-truth as a tree structure of HTML tags.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 245.03, "r_y0": 126.08100000000002, "r_x1": 286.365, "r_y1": 126.08100000000002, "r_x2": 286.365, "r_y2": 117.529, "r_x3": 245.03, "r_y3": 117.529, "coord_origin": "TOPLEFT"}, "text": "This simi-", "orig": "This simi-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 138.03700000000003, "r_x1": 136.717, "r_y1": 138.03700000000003, "r_x2": 136.717, "r_y2": 129.485, "r_x3": 50.112, "r_y3": 129.485, "coord_origin": "TOPLEFT"}, "text": "larity is calculated as:", "orig": "larity is calculated as:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 13, "label": "formula", "bbox": {"l": 86.219, "t": 150.428, "r": 286.362, "b": 173.63199999999995, "coord_origin": "TOPLEFT"}, "confidence": 0.9500409364700317, "cells": [{"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 86.219, "r_y0": 165.87400000000002, "r_x1": 118.878, "r_y1": 165.87400000000002, "r_x2": 118.878, "r_y2": 157.168, "r_x3": 86.219, "r_y3": 157.168, "coord_origin": "TOPLEFT"}, "text": "TEDS(", "orig": "TEDS(", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 118.875, "r_y0": 165.87400000000002, "r_x1": 139.77, "r_y1": 165.87400000000002, "r_x2": 139.77, "r_y2": 157.168, "r_x3": 118.875, "r_y3": 157.168, "coord_origin": "TOPLEFT"}, "text": "T , T", "orig": "T , T", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 124.697, "r_y0": 166.798, "r_x1": 129.019, "r_y1": 166.798, "r_x2": 129.019, "r_y2": 160.70399999999995, "r_x3": 124.697, "r_y3": 160.70399999999995, "coord_origin": "TOPLEFT"}, "text": "a", "orig": "a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 139.766, "r_y0": 166.798, "r_x1": 143.27, "r_y1": 166.798, "r_x2": 143.27, "r_y2": 160.70399999999995, "r_x3": 139.766, "r_y3": 160.70399999999995, "coord_origin": "TOPLEFT"}, "text": "b", "orig": "b", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 143.768, "r_y0": 165.87400000000002, "r_x1": 165.902, "r_y1": 165.87400000000002, "r_x2": 165.902, "r_y2": 157.168, "r_x3": 143.768, "r_y3": 157.168, "coord_origin": "TOPLEFT"}, "text": ") = 1", "orig": ") = 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 168.121, "r_y0": 165.73199999999997, "r_x1": 175.87, "r_y1": 165.73199999999997, "r_x2": 175.87, "r_y2": 157.168, "r_x3": 168.121, "r_y3": 157.168, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 179.279, "r_y0": 159.13400000000001, "r_x1": 221.957, "r_y1": 159.13400000000001, "r_x2": 221.957, "r_y2": 150.428, "r_x3": 179.279, "r_y3": 150.428, "coord_origin": "TOPLEFT"}, "text": "EditDist (", "orig": "EditDist (", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 221.952, "r_y0": 159.13400000000001, "r_x1": 242.848, "r_y1": 159.13400000000001, "r_x2": 242.848, "r_y2": 150.428, "r_x3": 221.952, "r_y3": 150.428, "coord_origin": "TOPLEFT"}, "text": "T , T", "orig": "T , T", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 227.774, "r_y0": 160.058, "r_x1": 232.096, "r_y1": 160.058, "r_x2": 232.096, "r_y2": 153.96400000000006, "r_x3": 227.774, "r_y3": 153.96400000000006, "coord_origin": "TOPLEFT"}, "text": "a", "orig": "a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 242.843, "r_y0": 160.058, "r_x1": 246.347, "r_y1": 160.058, "r_x2": 246.347, "r_y2": 153.96400000000006, "r_x3": 242.843, "r_y3": 153.96400000000006, "coord_origin": "TOPLEFT"}, "text": "b", "orig": "b", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 246.845, "r_y0": 159.13400000000001, "r_x1": 250.719, "r_y1": 159.13400000000001, "r_x2": 250.719, "r_y2": 150.428, "r_x3": 246.845, "r_y3": 150.428, "coord_origin": "TOPLEFT"}, "text": ")", "orig": ")", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 182.212, "r_y0": 172.70799999999997, "r_x1": 206.292, "r_y1": 172.70799999999997, "r_x2": 206.292, "r_y2": 164.00199999999995, "r_x3": 182.212, "r_y3": 164.00199999999995, "coord_origin": "TOPLEFT"}, "text": "max(", "orig": "max(", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 206.289, "r_y0": 172.56600000000003, "r_x1": 209.057, "r_y1": 172.56600000000003, "r_x2": 209.057, "r_y2": 164.00199999999995, "r_x3": 206.289, "r_y3": 164.00199999999995, "coord_origin": "TOPLEFT"}, "text": "|", "orig": "|", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 19, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 209.056, "r_y0": 172.70799999999997, "r_x1": 214.878, "r_y1": 172.70799999999997, "r_x2": 214.878, "r_y2": 164.00199999999995, "r_x3": 209.056, "r_y3": 164.00199999999995, "coord_origin": "TOPLEFT"}, "text": "T", "orig": "T", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 20, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 214.878, "r_y0": 173.63199999999995, "r_x1": 219.2, "r_y1": 173.63199999999995, "r_x2": 219.2, "r_y2": 167.538, "r_x3": 214.878, "r_y3": 167.538, "coord_origin": "TOPLEFT"}, "text": "a", "orig": "a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 21, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 219.697, "r_y0": 172.56600000000003, "r_x1": 222.465, "r_y1": 172.56600000000003, "r_x2": 222.465, "r_y2": 164.00199999999995, "r_x3": 219.697, "r_y3": 164.00199999999995, "coord_origin": "TOPLEFT"}, "text": "|", "orig": "|", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 22, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 224.125, "r_y0": 172.70799999999997, "r_x1": 226.893, "r_y1": 172.70799999999997, "r_x2": 226.893, "r_y2": 164.00199999999995, "r_x3": 224.125, "r_y3": 164.00199999999995, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 23, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 228.553, "r_y0": 172.56600000000003, "r_x1": 231.321, "r_y1": 172.56600000000003, "r_x2": 231.321, "r_y2": 164.00199999999995, "r_x3": 228.553, "r_y3": 164.00199999999995, "coord_origin": "TOPLEFT"}, "text": "|", "orig": "|", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 24, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 231.32, "r_y0": 172.70799999999997, "r_x1": 237.142, "r_y1": 172.70799999999997, "r_x2": 237.142, "r_y2": 164.00199999999995, "r_x3": 231.32, "r_y3": 164.00199999999995, "coord_origin": "TOPLEFT"}, "text": "T", "orig": "T", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 25, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 237.142, "r_y0": 173.63199999999995, "r_x1": 240.646, "r_y1": 173.63199999999995, "r_x2": 240.646, "r_y2": 167.538, "r_x3": 237.142, "r_y3": 167.538, "coord_origin": "TOPLEFT"}, "text": "b", "orig": "b", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 26, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 241.144, "r_y0": 172.56600000000003, "r_x1": 243.912, "r_y1": 172.56600000000003, "r_x2": 243.912, "r_y2": 164.00199999999995, "r_x3": 241.144, "r_y3": 164.00199999999995, "coord_origin": "TOPLEFT"}, "text": "|", "orig": "|", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 27, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 243.911, "r_y0": 172.70799999999997, "r_x1": 247.785, "r_y1": 172.70799999999997, "r_x2": 247.785, "r_y2": 164.00199999999995, "r_x3": 243.911, "r_y3": 164.00199999999995, "coord_origin": "TOPLEFT"}, "text": ")", "orig": ")", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 28, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 274.746, "r_y0": 166.038, "r_x1": 286.362, "r_y1": 166.038, "r_x2": 286.362, "r_y2": 157.486, "r_x3": 274.746, "r_y3": 157.486, "coord_origin": "TOPLEFT"}, "text": "(3)", "orig": "(3)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 6, "label": "text", "bbox": {"l": 50.112, "t": 181.11300000000006, "r": 286.363, "b": 213.89300000000003, "coord_origin": "TOPLEFT"}, "confidence": 0.9735319018363953, "cells": [{"index": 29, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 189.98299999999995, "r_x1": 86.406, "r_y1": 189.98299999999995, "r_x2": 86.406, "r_y2": 181.43100000000004, "r_x3": 62.067, "r_y3": 181.43100000000004, "coord_origin": "TOPLEFT"}, "text": "where", "orig": "where", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 30, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 88.581, "r_y0": 189.81899999999996, "r_x1": 94.403, "r_y1": 189.81899999999996, "r_x2": 94.403, "r_y2": 181.11300000000006, "r_x3": 88.581, "r_y3": 181.11300000000006, "coord_origin": "TOPLEFT"}, "text": "T", "orig": "T", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 94.403, "r_y0": 190.74199999999996, "r_x1": 98.725, "r_y1": 190.74199999999996, "r_x2": 98.725, "r_y2": 184.64800000000002, "r_x3": 94.403, "r_y3": 184.64800000000002, "coord_origin": "TOPLEFT"}, "text": "a", "orig": "a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 101.399, "r_y0": 189.98299999999995, "r_x1": 115.785, "r_y1": 189.98299999999995, "r_x2": 115.785, "r_y2": 181.43100000000004, "r_x3": 101.399, "r_y3": 181.43100000000004, "coord_origin": "TOPLEFT"}, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 117.961, "r_y0": 189.81899999999996, "r_x1": 123.783, "r_y1": 189.81899999999996, "r_x2": 123.783, "r_y2": 181.11300000000006, "r_x3": 117.961, "r_y3": 181.11300000000006, "coord_origin": "TOPLEFT"}, "text": "T", "orig": "T", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 123.783, "r_y0": 190.74199999999996, "r_x1": 127.287, "r_y1": 190.74199999999996, "r_x2": 127.287, "r_y2": 184.64800000000002, "r_x3": 123.783, "r_y3": 184.64800000000002, "coord_origin": "TOPLEFT"}, "text": "b", "orig": "b", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 129.96, "r_y0": 189.98299999999995, "r_x1": 286.363, "r_y1": 189.98299999999995, "r_x2": 286.363, "r_y2": 181.43100000000004, "r_x3": 129.96, "r_y3": 181.43100000000004, "coord_origin": "TOPLEFT"}, "text": "represent tables in tree structure HTML", "orig": "represent tables in tree structure HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 201.938, "r_x1": 252.781, "r_y1": 201.938, "r_x2": 252.781, "r_y2": 193.38599999999997, "r_x3": 50.112, "r_y3": 193.38599999999997, "coord_origin": "TOPLEFT"}, "text": "format. EditDist denotes the tree-edit distance, and", "orig": "format. EditDist denotes the tree-edit distance, and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 255.182, "r_y0": 201.63199999999995, "r_x1": 257.95, "r_y1": 201.63199999999995, "r_x2": 257.95, "r_y2": 193.06799999999998, "r_x3": 255.182, "r_y3": 193.06799999999998, "coord_origin": "TOPLEFT"}, "text": "|", "orig": "|", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 257.949, "r_y0": 201.774, "r_x1": 263.771, "r_y1": 201.774, "r_x2": 263.771, "r_y2": 193.06799999999998, "r_x3": 257.949, "r_y3": 193.06799999999998, "coord_origin": "TOPLEFT"}, "text": "T", "orig": "T", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 265.155, "r_y0": 201.63199999999995, "r_x1": 267.923, "r_y1": 201.63199999999995, "r_x2": 267.923, "r_y2": 193.06799999999998, "r_x3": 265.155, "r_y3": 193.06799999999998, "coord_origin": "TOPLEFT"}, "text": "|", "orig": "|", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 270.322, "r_y0": 201.938, "r_x1": 286.362, "r_y1": 201.938, "r_x2": 286.362, "r_y2": 193.38599999999997, "r_x3": 270.322, "r_y3": 193.38599999999997, "coord_origin": "TOPLEFT"}, "text": "rep-", "orig": "rep-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 213.89300000000003, "r_x1": 172.134, "r_y1": 213.89300000000003, "r_x2": 172.134, "r_y2": 205.341, "r_x3": 50.112, "r_y3": 205.341, "coord_origin": "TOPLEFT"}, "text": "resents the number of nodes in", "orig": "resents the number of nodes in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 174.624, "r_y0": 213.72900000000004, "r_x1": 180.446, "r_y1": 213.72900000000004, "r_x2": 180.446, "r_y2": 205.02300000000002, "r_x3": 174.624, "r_y3": 205.02300000000002, "coord_origin": "TOPLEFT"}, "text": "T", "orig": "T", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 181.829, "r_y0": 213.89300000000003, "r_x1": 184.32, "r_y1": 213.89300000000003, "r_x2": 184.32, "r_y2": 205.341, "r_x3": 181.829, "r_y3": 205.341, "coord_origin": "TOPLEFT"}, "text": ".", "orig": ".", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 9, "label": "section_header", "bbox": {"l": 50.112, "t": 224.81899999999996, "r": 170.452, "b": 234.67100000000005, "coord_origin": "TOPLEFT"}, "confidence": 0.9588837027549744, "cells": [{"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 234.67100000000005, "r_x1": 170.452, "r_y1": 234.67100000000005, "r_x2": 170.452, "r_y2": 224.81899999999996, "r_x3": 50.112, "r_y3": 224.81899999999996, "coord_origin": "TOPLEFT"}, "text": "5.4. Quantitative Analysis", "orig": "5.4. Quantitative Analysis", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 2, "label": "text", "bbox": {"l": 50.112, "t": 243.64999999999998, "r": 286.365, "b": 396.052, "coord_origin": "TOPLEFT"}, "confidence": 0.9855090975761414, "cells": [{"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 252.606, "r_x1": 105.325, "r_y1": 252.606, "r_x2": 105.325, "r_y2": 243.64999999999998, "r_x3": 62.067, "r_y3": 243.64999999999998, "coord_origin": "TOPLEFT"}, "text": "Structure.", "orig": "Structure.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 112.126, "r_y0": 252.59000000000003, "r_x1": 184.684, "r_y1": 252.59000000000003, "r_x2": 184.684, "r_y2": 244.038, "r_x3": 112.126, "r_y3": 244.038, "coord_origin": "TOPLEFT"}, "text": "As shown in Tab.", "orig": "As shown in Tab.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 191.478, "r_y0": 252.59000000000003, "r_x1": 198.95, "r_y1": 252.59000000000003, "r_x2": 198.95, "r_y2": 244.038, "r_x3": 191.478, "r_y3": 244.038, "coord_origin": "TOPLEFT"}, "text": "2,", "orig": "2,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 48, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 202.995, "r_y0": 252.59000000000003, "r_x1": 286.362, "r_y1": 252.59000000000003, "r_x2": 286.362, "r_y2": 244.038, "r_x3": 202.995, "r_y3": 244.038, "coord_origin": "TOPLEFT"}, "text": "TableFormer outper-", "orig": "TableFormer outper-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 49, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 264.54499999999996, "r_x1": 286.365, "r_y1": 264.54499999999996, "r_x2": 286.365, "r_y2": 255.99300000000005, "r_x3": 50.112, "r_y3": 255.99300000000005, "coord_origin": "TOPLEFT"}, "text": "forms all SOTA methods across different datasets by a large", "orig": "forms all SOTA methods across different datasets by a large", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 50, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 276.5, "r_x1": 138.719, "r_y1": 276.5, "r_x2": 138.719, "r_y2": 267.948, "r_x3": 50.112, "r_y3": 267.948, "coord_origin": "TOPLEFT"}, "text": "margin for predicting", "orig": "margin for predicting", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 51, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 142.993, "r_y0": 276.5, "r_x1": 155.168, "r_y1": 276.5, "r_x2": 155.168, "r_y2": 267.948, "r_x3": 142.993, "r_y3": 267.948, "coord_origin": "TOPLEFT"}, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 52, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 159.432, "r_y0": 276.5, "r_x1": 178.799, "r_y1": 276.5, "r_x2": 178.799, "r_y2": 267.948, "r_x3": 159.432, "r_y3": 267.948, "coord_origin": "TOPLEFT"}, "text": "table", "orig": "table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 53, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.073, "r_y0": 276.5, "r_x1": 217.932, "r_y1": 276.5, "r_x2": 217.932, "r_y2": 267.948, "r_x3": 183.073, "r_y3": 267.948, "coord_origin": "TOPLEFT"}, "text": "structure", "orig": "structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 54, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 222.206, "r_y0": 276.5, "r_x1": 286.365, "r_y1": 276.5, "r_x2": 286.365, "r_y2": 267.948, "r_x3": 222.206, "r_y3": 267.948, "coord_origin": "TOPLEFT"}, "text": "from an image.", "orig": "from an image.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 55, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 288.455, "r_x1": 286.365, "r_y1": 288.455, "r_x2": 286.365, "r_y2": 279.903, "r_x3": 50.112, "r_y3": 279.903, "coord_origin": "TOPLEFT"}, "text": "All the more, our model outperforms pre-trained methods.", "orig": "All the more, our model outperforms pre-trained methods.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 56, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 300.411, "r_x1": 286.365, "r_y1": 300.411, "r_x2": 286.365, "r_y2": 291.859, "r_x3": 50.112, "r_y3": 291.859, "coord_origin": "TOPLEFT"}, "text": "During the evaluation we do not apply any table filtering.", "orig": "During the evaluation we do not apply any table filtering.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 57, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 312.366, "r_x1": 286.365, "r_y1": 312.366, "r_x2": 286.365, "r_y2": 303.814, "r_x3": 50.112, "r_y3": 303.814, "coord_origin": "TOPLEFT"}, "text": "We also provide our baseline results on the SynthTabNet", "orig": "We also provide our baseline results on the SynthTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 58, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 324.321, "r_x1": 80.269, "r_y1": 324.321, "r_x2": 80.269, "r_y2": 315.769, "r_x3": 50.112, "r_y3": 315.769, "coord_origin": "TOPLEFT"}, "text": "dataset.", "orig": "dataset.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 59, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 85.579, "r_y0": 324.321, "r_x1": 91.666, "r_y1": 324.321, "r_x2": 91.666, "r_y2": 315.769, "r_x3": 85.579, "r_y3": 315.769, "coord_origin": "TOPLEFT"}, "text": "It", "orig": "It", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 60, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 94.894, "r_y0": 324.321, "r_x1": 257.812, "r_y1": 324.321, "r_x2": 257.812, "r_y2": 315.769, "r_x3": 94.894, "r_y3": 315.769, "coord_origin": "TOPLEFT"}, "text": "has been observed that large tables (e.g.", "orig": "has been observed that large tables (e.g.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 61, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 263.122, "r_y0": 324.321, "r_x1": 286.365, "r_y1": 324.321, "r_x2": 286.365, "r_y2": 315.769, "r_x3": 263.122, "r_y3": 315.769, "coord_origin": "TOPLEFT"}, "text": "tables", "orig": "tables", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 62, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 336.276, "r_x1": 286.365, "r_y1": 336.276, "r_x2": 286.365, "r_y2": 327.724, "r_x3": 50.112, "r_y3": 327.724, "coord_origin": "TOPLEFT"}, "text": "that occupy half of the page or more) yield poor predictions.", "orig": "that occupy half of the page or more) yield poor predictions.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 63, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 348.231, "r_x1": 286.365, "r_y1": 348.231, "r_x2": 286.365, "r_y2": 339.679, "r_x3": 50.112, "r_y3": 339.679, "coord_origin": "TOPLEFT"}, "text": "We attribute this issue to the image resizing during the pre-", "orig": "We attribute this issue to the image resizing during the pre-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 64, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 360.186, "r_x1": 115.068, "r_y1": 360.186, "r_x2": 115.068, "r_y2": 351.634, "r_x3": 50.112, "r_y3": 351.634, "coord_origin": "TOPLEFT"}, "text": "processing step,", "orig": "processing step,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 65, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 119.203, "r_y0": 360.186, "r_x1": 134.147, "r_y1": 360.186, "r_x2": 134.147, "r_y2": 351.634, "r_x3": 119.203, "r_y3": 351.634, "coord_origin": "TOPLEFT"}, "text": "that", "orig": "that", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 66, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 137.952, "r_y0": 360.186, "r_x1": 286.365, "r_y1": 360.186, "r_x2": 286.365, "r_y2": 351.634, "r_x3": 137.952, "r_y3": 351.634, "coord_origin": "TOPLEFT"}, "text": "produces downsampled images with", "orig": "produces downsampled images with", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 67, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 372.142, "r_x1": 155.357, "r_y1": 372.142, "r_x2": 155.357, "r_y2": 363.59, "r_x3": 50.112, "r_y3": 363.59, "coord_origin": "TOPLEFT"}, "text": "indistinguishable features.", "orig": "indistinguishable features.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 68, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.378, "r_y0": 372.142, "r_x1": 286.365, "r_y1": 372.142, "r_x2": 286.365, "r_y2": 363.59, "r_x3": 160.378, "r_y3": 363.59, "coord_origin": "TOPLEFT"}, "text": "This problem can be addressed", "orig": "This problem can be addressed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 69, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 384.097, "r_x1": 286.365, "r_y1": 384.097, "r_x2": 286.365, "r_y2": 375.545, "r_x3": 50.112, "r_y3": 375.545, "coord_origin": "TOPLEFT"}, "text": "by treating such big tables with a separate model which ac-", "orig": "by treating such big tables with a separate model which ac-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 70, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 396.052, "r_x1": 170.012, "r_y1": 396.052, "r_x2": 170.012, "r_y2": 387.5, "r_x3": 50.112, "r_y3": 387.5, "coord_origin": "TOPLEFT"}, "text": "cepts a large input image size.", "orig": "cepts a large input image size.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 0, "label": "table", "bbox": {"l": 53.368526458740234, "t": 409.1357727050781, "r": 283.0443420410156, "b": 582.3977661132812, "coord_origin": "TOPLEFT"}, "confidence": 0.9892510175704956, "cells": [{"index": 71, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 78.843, "r_y0": 429.511, "r_x1": 104.855, "r_y1": 429.511, "r_x2": 104.855, "r_y2": 420.959, "r_x3": 78.843, "r_y3": 420.959, "coord_origin": "TOPLEFT"}, "text": "Model", "orig": "Model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 72, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 211.2, "r_y0": 423.533, "r_x1": 236.107, "r_y1": 423.533, "r_x2": 236.107, "r_y2": 414.981, "r_x3": 211.2, "r_y3": 414.981, "coord_origin": "TOPLEFT"}, "text": "TEDS", "orig": "TEDS", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 73, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 129.338, "r_y0": 435.488, "r_x1": 159.216, "r_y1": 435.488, "r_x2": 159.216, "r_y2": 426.936, "r_x3": 129.338, "r_y3": 426.936, "coord_origin": "TOPLEFT"}, "text": "Dataset", "orig": "Dataset", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 74, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 171.171, "r_y0": 435.488, "r_x1": 199.405, "r_y1": 435.488, "r_x2": 199.405, "r_y2": 426.936, "r_x3": 171.171, "r_y3": 426.936, "coord_origin": "TOPLEFT"}, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 75, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 211.36, "r_y0": 435.488, "r_x1": 247.744, "r_y1": 435.488, "r_x2": 247.744, "r_y2": 426.936, "r_x3": 211.36, "r_y3": 426.936, "coord_origin": "TOPLEFT"}, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 76, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 264.54, "r_y0": 435.488, "r_x1": 277.273, "r_y1": 435.488, "r_x2": 277.273, "r_y2": 426.936, "r_x3": 264.54, "r_y3": 426.936, "coord_origin": "TOPLEFT"}, "text": "All", "orig": "All", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 77, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 81.612, "r_y0": 452.445, "r_x1": 102.085, "r_y1": 452.445, "r_x2": 102.085, "r_y2": 443.893, "r_x3": 81.612, "r_y3": 443.893, "coord_origin": "TOPLEFT"}, "text": "EDD", "orig": "EDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 78, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.872, "r_y0": 452.445, "r_x1": 153.691, "r_y1": 452.445, "r_x2": 153.691, "r_y2": 443.893, "r_x3": 134.872, "r_y3": 443.893, "coord_origin": "TOPLEFT"}, "text": "PTN", "orig": "PTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 79, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 176.566, "r_y0": 452.445, "r_x1": 194.0, "r_y1": 452.445, "r_x2": 194.0, "r_y2": 443.893, "r_x3": 176.566, "r_y3": 443.893, "coord_origin": "TOPLEFT"}, "text": "91.1", "orig": "91.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 80, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 220.829, "r_y0": 452.445, "r_x1": 238.264, "r_y1": 452.445, "r_x2": 238.264, "r_y2": 443.893, "r_x3": 220.829, "r_y3": 443.893, "coord_origin": "TOPLEFT"}, "text": "88.7", "orig": "88.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 81, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 262.184, "r_y0": 452.445, "r_x1": 279.619, "r_y1": 452.445, "r_x2": 279.619, "r_y2": 443.893, "r_x3": 262.184, "r_y3": 443.893, "coord_origin": "TOPLEFT"}, "text": "89.9", "orig": "89.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 82, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 82.165, "r_y0": 464.401, "r_x1": 101.532, "r_y1": 464.401, "r_x2": 101.532, "r_y2": 455.849, "r_x3": 82.165, "r_y3": 455.849, "coord_origin": "TOPLEFT"}, "text": "GTE", "orig": "GTE", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 83, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.867, "r_y0": 464.401, "r_x1": 153.687, "r_y1": 464.401, "r_x2": 153.687, "r_y2": 455.849, "r_x3": 134.867, "r_y3": 455.849, "coord_origin": "TOPLEFT"}, "text": "PTN", "orig": "PTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 84, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.624, "r_y0": 464.401, "r_x1": 186.942, "r_y1": 464.401, "r_x2": 186.942, "r_y2": 455.849, "r_x3": 183.624, "r_y3": 455.849, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 85, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 227.888, "r_y0": 464.401, "r_x1": 231.205, "r_y1": 464.401, "r_x2": 231.205, "r_y2": 455.849, "r_x3": 227.888, "r_y3": 455.849, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 86, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 259.699, "r_y0": 464.401, "r_x1": 282.114, "r_y1": 464.401, "r_x2": 282.114, "r_y2": 455.849, "r_x3": 259.699, "r_y3": 455.849, "coord_origin": "TOPLEFT"}, "text": "93.01", "orig": "93.01", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 87, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 66.315, "r_y0": 476.954, "r_x1": 117.383, "r_y1": 476.954, "r_x2": 117.383, "r_y2": 468.402, "r_x3": 66.315, "r_y3": 468.402, "coord_origin": "TOPLEFT"}, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 88, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.868, "r_y0": 476.954, "r_x1": 153.687, "r_y1": 476.954, "r_x2": 153.687, "r_y2": 468.402, "r_x3": 134.868, "r_y3": 468.402, "coord_origin": "TOPLEFT"}, "text": "PTN", "orig": "PTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 89, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 176.571, "r_y0": 476.954, "r_x1": 194.006, "r_y1": 476.954, "r_x2": 194.006, "r_y2": 468.402, "r_x3": 176.571, "r_y3": 468.402, "coord_origin": "TOPLEFT"}, "text": "98.5", "orig": "98.5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 90, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 220.835, "r_y0": 476.954, "r_x1": 238.269, "r_y1": 476.954, "r_x2": 238.269, "r_y2": 468.402, "r_x3": 220.835, "r_y3": 468.402, "coord_origin": "TOPLEFT"}, "text": "95.0", "orig": "95.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 91, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 259.698, "r_y0": 476.97, "r_x1": 282.114, "r_y1": 476.97, "r_x2": 282.114, "r_y2": 468.014, "r_x3": 259.698, "r_y3": 468.014, "coord_origin": "TOPLEFT"}, "text": "96.75", "orig": "96.75", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 92, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 81.612, "r_y0": 492.147, "r_x1": 102.085, "r_y1": 492.147, "r_x2": 102.085, "r_y2": 483.595, "r_x3": 81.612, "r_y3": 483.595, "coord_origin": "TOPLEFT"}, "text": "EDD", "orig": "EDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 93, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.872, "r_y0": 492.147, "r_x1": 153.691, "r_y1": 492.147, "r_x2": 153.691, "r_y2": 483.595, "r_x3": 134.872, "r_y3": 483.595, "coord_origin": "TOPLEFT"}, "text": "FTN", "orig": "FTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 94, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 176.566, "r_y0": 492.147, "r_x1": 194.0, "r_y1": 492.147, "r_x2": 194.0, "r_y2": 483.595, "r_x3": 176.566, "r_y3": 483.595, "coord_origin": "TOPLEFT"}, "text": "88.4", "orig": "88.4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 95, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 218.339, "r_y0": 492.147, "r_x1": 240.755, "r_y1": 492.147, "r_x2": 240.755, "r_y2": 483.595, "r_x3": 218.339, "r_y3": 483.595, "coord_origin": "TOPLEFT"}, "text": "92.08", "orig": "92.08", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 96, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 262.184, "r_y0": 492.147, "r_x1": 279.619, "r_y1": 492.147, "r_x2": 279.619, "r_y2": 483.595, "r_x3": 262.184, "r_y3": 483.595, "coord_origin": "TOPLEFT"}, "text": "90.6", "orig": "90.6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 97, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 82.165, "r_y0": 504.102, "r_x1": 101.532, "r_y1": 504.102, "r_x2": 101.532, "r_y2": 495.55, "r_x3": 82.165, "r_y3": 495.55, "coord_origin": "TOPLEFT"}, "text": "GTE", "orig": "GTE", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 98, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.867, "r_y0": 504.102, "r_x1": 153.687, "r_y1": 504.102, "r_x2": 153.687, "r_y2": 495.55, "r_x3": 134.867, "r_y3": 495.55, "coord_origin": "TOPLEFT"}, "text": "FTN", "orig": "FTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 99, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.624, "r_y0": 504.102, "r_x1": 186.942, "r_y1": 504.102, "r_x2": 186.942, "r_y2": 495.55, "r_x3": 183.624, "r_y3": 495.55, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 100, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 227.888, "r_y0": 504.102, "r_x1": 231.205, "r_y1": 504.102, "r_x2": 231.205, "r_y2": 495.55, "r_x3": 227.888, "r_y3": 495.55, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 101, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 259.699, "r_y0": 504.102, "r_x1": 282.114, "r_y1": 504.102, "r_x2": 282.114, "r_y2": 495.55, "r_x3": 259.699, "r_y3": 495.55, "coord_origin": "TOPLEFT"}, "text": "87.14", "orig": "87.14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 102, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 71.789, "r_y0": 516.057, "r_x1": 111.908, "r_y1": 516.057, "r_x2": 111.908, "r_y2": 507.505, "r_x3": 71.789, "r_y3": 507.505, "coord_origin": "TOPLEFT"}, "text": "GTE (FT)", "orig": "GTE (FT)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 103, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.862, "r_y0": 516.057, "r_x1": 153.682, "r_y1": 516.057, "r_x2": 153.682, "r_y2": 507.505, "r_x3": 134.862, "r_y3": 507.505, "coord_origin": "TOPLEFT"}, "text": "FTN", "orig": "FTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 104, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.629, "r_y0": 516.057, "r_x1": 186.947, "r_y1": 516.057, "r_x2": 186.947, "r_y2": 507.505, "r_x3": 183.629, "r_y3": 507.505, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 105, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 227.893, "r_y0": 516.057, "r_x1": 231.211, "r_y1": 516.057, "r_x2": 231.211, "r_y2": 507.505, "r_x3": 227.893, "r_y3": 507.505, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 106, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 259.694, "r_y0": 516.057, "r_x1": 282.109, "r_y1": 516.057, "r_x2": 282.109, "r_y2": 507.505, "r_x3": 259.694, "r_y3": 507.505, "coord_origin": "TOPLEFT"}, "text": "91.02", "orig": "91.02", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 107, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 66.315, "r_y0": 528.012, "r_x1": 117.383, "r_y1": 528.012, "r_x2": 117.383, "r_y2": 519.46, "r_x3": 66.315, "r_y3": 519.46, "coord_origin": "TOPLEFT"}, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 108, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.868, "r_y0": 528.012, "r_x1": 153.687, "r_y1": 528.012, "r_x2": 153.687, "r_y2": 519.46, "r_x3": 134.868, "r_y3": 519.46, "coord_origin": "TOPLEFT"}, "text": "FTN", "orig": "FTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 109, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 176.571, "r_y0": 528.012, "r_x1": 194.006, "r_y1": 528.012, "r_x2": 194.006, "r_y2": 519.46, "r_x3": 176.571, "r_y3": 519.46, "coord_origin": "TOPLEFT"}, "text": "97.5", "orig": "97.5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 110, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 220.835, "r_y0": 528.012, "r_x1": 238.269, "r_y1": 528.012, "r_x2": 238.269, "r_y2": 519.46, "r_x3": 220.835, "r_y3": 519.46, "coord_origin": "TOPLEFT"}, "text": "96.0", "orig": "96.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 111, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 262.189, "r_y0": 528.028, "r_x1": 279.624, "r_y1": 528.028, "r_x2": 279.624, "r_y2": 519.072, "r_x3": 262.189, "r_y3": 519.072, "coord_origin": "TOPLEFT"}, "text": "96.8", "orig": "96.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 112, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 81.612, "r_y0": 545.319, "r_x1": 102.085, "r_y1": 545.319, "r_x2": 102.085, "r_y2": 536.767, "r_x3": 81.612, "r_y3": 536.767, "coord_origin": "TOPLEFT"}, "text": "EDD", "orig": "EDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 113, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 137.911, "r_y0": 545.319, "r_x1": 150.643, "r_y1": 545.319, "r_x2": 150.643, "r_y2": 536.767, "r_x3": 137.911, "r_y3": 536.767, "coord_origin": "TOPLEFT"}, "text": "TB", "orig": "TB", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 114, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 176.566, "r_y0": 545.319, "r_x1": 194.0, "r_y1": 545.319, "r_x2": 194.0, "r_y2": 536.767, "r_x3": 176.566, "r_y3": 536.767, "coord_origin": "TOPLEFT"}, "text": "86.0", "orig": "86.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 115, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 227.893, "r_y0": 545.319, "r_x1": 231.21, "r_y1": 545.319, "r_x2": 231.21, "r_y2": 536.767, "r_x3": 227.893, "r_y3": 536.767, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 116, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 262.184, "r_y0": 545.319, "r_x1": 279.619, "r_y1": 545.319, "r_x2": 279.619, "r_y2": 536.767, "r_x3": 262.184, "r_y3": 536.767, "coord_origin": "TOPLEFT"}, "text": "86.0", "orig": "86.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 117, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 66.315, "r_y0": 557.275, "r_x1": 117.383, "r_y1": 557.275, "r_x2": 117.383, "r_y2": 548.723, "r_x3": 66.315, "r_y3": 548.723, "coord_origin": "TOPLEFT"}, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 118, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 137.906, "r_y0": 557.275, "r_x1": 150.638, "r_y1": 557.275, "r_x2": 150.638, "r_y2": 548.723, "r_x3": 137.906, "r_y3": 548.723, "coord_origin": "TOPLEFT"}, "text": "TB", "orig": "TB", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 119, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 176.571, "r_y0": 557.275, "r_x1": 194.006, "r_y1": 557.275, "r_x2": 194.006, "r_y2": 548.723, "r_x3": 176.571, "r_y3": 548.723, "coord_origin": "TOPLEFT"}, "text": "89.6", "orig": "89.6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 120, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 227.888, "r_y0": 557.275, "r_x1": 231.206, "r_y1": 557.275, "r_x2": 231.206, "r_y2": 548.723, "r_x3": 227.888, "r_y3": 548.723, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 121, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 262.189, "r_y0": 557.2909999999999, "r_x1": 279.624, "r_y1": 557.2909999999999, "r_x2": 279.624, "r_y2": 548.335, "r_x3": 262.189, "r_y3": 548.335, "coord_origin": "TOPLEFT"}, "text": "89.6", "orig": "89.6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 122, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 66.315, "r_y0": 576.823, "r_x1": 117.383, "r_y1": 576.823, "r_x2": 117.383, "r_y2": 568.271, "r_x3": 66.315, "r_y3": 568.271, "coord_origin": "TOPLEFT"}, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 123, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.868, "r_y0": 576.823, "r_x1": 153.687, "r_y1": 576.823, "r_x2": 153.687, "r_y2": 568.271, "r_x3": 134.868, "r_y3": 568.271, "coord_origin": "TOPLEFT"}, "text": "STN", "orig": "STN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 124, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 176.571, "r_y0": 576.823, "r_x1": 194.006, "r_y1": 576.823, "r_x2": 194.006, "r_y2": 568.271, "r_x3": 176.571, "r_y3": 568.271, "coord_origin": "TOPLEFT"}, "text": "96.9", "orig": "96.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 125, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 220.835, "r_y0": 576.823, "r_x1": 238.269, "r_y1": 576.823, "r_x2": 238.269, "r_y2": 568.271, "r_x3": 220.835, "r_y3": 568.271, "coord_origin": "TOPLEFT"}, "text": "95.7", "orig": "95.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 126, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 262.19, "r_y0": 576.823, "r_x1": 279.624, "r_y1": 576.823, "r_x2": 279.624, "r_y2": 568.271, "r_x3": 262.19, "r_y3": 568.271, "coord_origin": "TOPLEFT"}, "text": "96.7", "orig": "96.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": [{"id": 27, "label": "text", "bbox": {"l": 78.843, "t": 420.959, "r": 104.855, "b": 429.511, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 71, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 78.843, "r_y0": 429.511, "r_x1": 104.855, "r_y1": 429.511, "r_x2": 104.855, "r_y2": 420.959, "r_x3": 78.843, "r_y3": 420.959, "coord_origin": "TOPLEFT"}, "text": "Model", "orig": "Model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 28, "label": "text", "bbox": {"l": 211.2, "t": 414.981, "r": 236.107, "b": 423.533, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 72, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 211.2, "r_y0": 423.533, "r_x1": 236.107, "r_y1": 423.533, "r_x2": 236.107, "r_y2": 414.981, "r_x3": 211.2, "r_y3": 414.981, "coord_origin": "TOPLEFT"}, "text": "TEDS", "orig": "TEDS", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 29, "label": "text", "bbox": {"l": 129.338, "t": 426.936, "r": 159.216, "b": 435.488, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 73, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 129.338, "r_y0": 435.488, "r_x1": 159.216, "r_y1": 435.488, "r_x2": 159.216, "r_y2": 426.936, "r_x3": 129.338, "r_y3": 426.936, "coord_origin": "TOPLEFT"}, "text": "Dataset", "orig": "Dataset", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 30, "label": "text", "bbox": {"l": 171.171, "t": 426.936, "r": 199.405, "b": 435.488, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 74, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 171.171, "r_y0": 435.488, "r_x1": 199.405, "r_y1": 435.488, "r_x2": 199.405, "r_y2": 426.936, "r_x3": 171.171, "r_y3": 426.936, "coord_origin": "TOPLEFT"}, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 31, "label": "text", "bbox": {"l": 211.36, "t": 426.936, "r": 247.744, "b": 435.488, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 75, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 211.36, "r_y0": 435.488, "r_x1": 247.744, "r_y1": 435.488, "r_x2": 247.744, "r_y2": 426.936, "r_x3": 211.36, "r_y3": 426.936, "coord_origin": "TOPLEFT"}, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 32, "label": "text", "bbox": {"l": 264.54, "t": 426.936, "r": 277.273, "b": 435.488, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 76, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 264.54, "r_y0": 435.488, "r_x1": 277.273, "r_y1": 435.488, "r_x2": 277.273, "r_y2": 426.936, "r_x3": 264.54, "r_y3": 426.936, "coord_origin": "TOPLEFT"}, "text": "All", "orig": "All", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 33, "label": "text", "bbox": {"l": 81.612, "t": 443.893, "r": 102.085, "b": 452.445, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 77, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 81.612, "r_y0": 452.445, "r_x1": 102.085, "r_y1": 452.445, "r_x2": 102.085, "r_y2": 443.893, "r_x3": 81.612, "r_y3": 443.893, "coord_origin": "TOPLEFT"}, "text": "EDD", "orig": "EDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 34, "label": "text", "bbox": {"l": 134.872, "t": 443.893, "r": 153.691, "b": 452.445, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 78, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.872, "r_y0": 452.445, "r_x1": 153.691, "r_y1": 452.445, "r_x2": 153.691, "r_y2": 443.893, "r_x3": 134.872, "r_y3": 443.893, "coord_origin": "TOPLEFT"}, "text": "PTN", "orig": "PTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 35, "label": "text", "bbox": {"l": 176.566, "t": 443.893, "r": 194.0, "b": 452.445, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 79, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 176.566, "r_y0": 452.445, "r_x1": 194.0, "r_y1": 452.445, "r_x2": 194.0, "r_y2": 443.893, "r_x3": 176.566, "r_y3": 443.893, "coord_origin": "TOPLEFT"}, "text": "91.1", "orig": "91.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 36, "label": "text", "bbox": {"l": 220.829, "t": 443.893, "r": 238.264, "b": 452.445, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 80, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 220.829, "r_y0": 452.445, "r_x1": 238.264, "r_y1": 452.445, "r_x2": 238.264, "r_y2": 443.893, "r_x3": 220.829, "r_y3": 443.893, "coord_origin": "TOPLEFT"}, "text": "88.7", "orig": "88.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 37, "label": "text", "bbox": {"l": 262.184, "t": 443.893, "r": 279.619, "b": 452.445, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 81, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 262.184, "r_y0": 452.445, "r_x1": 279.619, "r_y1": 452.445, "r_x2": 279.619, "r_y2": 443.893, "r_x3": 262.184, "r_y3": 443.893, "coord_origin": "TOPLEFT"}, "text": "89.9", "orig": "89.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 38, "label": "text", "bbox": {"l": 82.165, "t": 455.849, "r": 101.532, "b": 464.401, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 82, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 82.165, "r_y0": 464.401, "r_x1": 101.532, "r_y1": 464.401, "r_x2": 101.532, "r_y2": 455.849, "r_x3": 82.165, "r_y3": 455.849, "coord_origin": "TOPLEFT"}, "text": "GTE", "orig": "GTE", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 39, "label": "text", "bbox": {"l": 134.867, "t": 455.849, "r": 153.687, "b": 464.401, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 83, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.867, "r_y0": 464.401, "r_x1": 153.687, "r_y1": 464.401, "r_x2": 153.687, "r_y2": 455.849, "r_x3": 134.867, "r_y3": 455.849, "coord_origin": "TOPLEFT"}, "text": "PTN", "orig": "PTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 40, "label": "text", "bbox": {"l": 183.624, "t": 455.849, "r": 186.942, "b": 464.401, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 84, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.624, "r_y0": 464.401, "r_x1": 186.942, "r_y1": 464.401, "r_x2": 186.942, "r_y2": 455.849, "r_x3": 183.624, "r_y3": 455.849, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 41, "label": "text", "bbox": {"l": 227.888, "t": 455.849, "r": 231.205, "b": 464.401, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 85, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 227.888, "r_y0": 464.401, "r_x1": 231.205, "r_y1": 464.401, "r_x2": 231.205, "r_y2": 455.849, "r_x3": 227.888, "r_y3": 455.849, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 42, "label": "text", "bbox": {"l": 259.699, "t": 455.849, "r": 282.114, "b": 464.401, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 86, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 259.699, "r_y0": 464.401, "r_x1": 282.114, "r_y1": 464.401, "r_x2": 282.114, "r_y2": 455.849, "r_x3": 259.699, "r_y3": 455.849, "coord_origin": "TOPLEFT"}, "text": "93.01", "orig": "93.01", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 43, "label": "text", "bbox": {"l": 66.315, "t": 468.402, "r": 117.383, "b": 476.954, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 87, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 66.315, "r_y0": 476.954, "r_x1": 117.383, "r_y1": 476.954, "r_x2": 117.383, "r_y2": 468.402, "r_x3": 66.315, "r_y3": 468.402, "coord_origin": "TOPLEFT"}, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 44, "label": "text", "bbox": {"l": 134.868, "t": 468.402, "r": 153.687, "b": 476.954, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 88, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.868, "r_y0": 476.954, "r_x1": 153.687, "r_y1": 476.954, "r_x2": 153.687, "r_y2": 468.402, "r_x3": 134.868, "r_y3": 468.402, "coord_origin": "TOPLEFT"}, "text": "PTN", "orig": "PTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 45, "label": "text", "bbox": {"l": 176.571, "t": 468.402, "r": 194.006, "b": 476.954, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 89, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 176.571, "r_y0": 476.954, "r_x1": 194.006, "r_y1": 476.954, "r_x2": 194.006, "r_y2": 468.402, "r_x3": 176.571, "r_y3": 468.402, "coord_origin": "TOPLEFT"}, "text": "98.5", "orig": "98.5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 46, "label": "text", "bbox": {"l": 220.835, "t": 468.402, "r": 238.269, "b": 476.954, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 90, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 220.835, "r_y0": 476.954, "r_x1": 238.269, "r_y1": 476.954, "r_x2": 238.269, "r_y2": 468.402, "r_x3": 220.835, "r_y3": 468.402, "coord_origin": "TOPLEFT"}, "text": "95.0", "orig": "95.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 47, "label": "text", "bbox": {"l": 259.698, "t": 468.014, "r": 282.114, "b": 476.97, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 91, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 259.698, "r_y0": 476.97, "r_x1": 282.114, "r_y1": 476.97, "r_x2": 282.114, "r_y2": 468.014, "r_x3": 259.698, "r_y3": 468.014, "coord_origin": "TOPLEFT"}, "text": "96.75", "orig": "96.75", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 48, "label": "text", "bbox": {"l": 81.612, "t": 483.595, "r": 102.085, "b": 492.147, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 92, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 81.612, "r_y0": 492.147, "r_x1": 102.085, "r_y1": 492.147, "r_x2": 102.085, "r_y2": 483.595, "r_x3": 81.612, "r_y3": 483.595, "coord_origin": "TOPLEFT"}, "text": "EDD", "orig": "EDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 49, "label": "text", "bbox": {"l": 134.872, "t": 483.595, "r": 153.691, "b": 492.147, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 93, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.872, "r_y0": 492.147, "r_x1": 153.691, "r_y1": 492.147, "r_x2": 153.691, "r_y2": 483.595, "r_x3": 134.872, "r_y3": 483.595, "coord_origin": "TOPLEFT"}, "text": "FTN", "orig": "FTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 50, "label": "text", "bbox": {"l": 176.566, "t": 483.595, "r": 194.0, "b": 492.147, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 94, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 176.566, "r_y0": 492.147, "r_x1": 194.0, "r_y1": 492.147, "r_x2": 194.0, "r_y2": 483.595, "r_x3": 176.566, "r_y3": 483.595, "coord_origin": "TOPLEFT"}, "text": "88.4", "orig": "88.4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 51, "label": "text", "bbox": {"l": 218.339, "t": 483.595, "r": 240.755, "b": 492.147, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 95, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 218.339, "r_y0": 492.147, "r_x1": 240.755, "r_y1": 492.147, "r_x2": 240.755, "r_y2": 483.595, "r_x3": 218.339, "r_y3": 483.595, "coord_origin": "TOPLEFT"}, "text": "92.08", "orig": "92.08", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 52, "label": "text", "bbox": {"l": 262.184, "t": 483.595, "r": 279.619, "b": 492.147, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 96, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 262.184, "r_y0": 492.147, "r_x1": 279.619, "r_y1": 492.147, "r_x2": 279.619, "r_y2": 483.595, "r_x3": 262.184, "r_y3": 483.595, "coord_origin": "TOPLEFT"}, "text": "90.6", "orig": "90.6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 53, "label": "text", "bbox": {"l": 82.165, "t": 495.55, "r": 101.532, "b": 504.102, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 97, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 82.165, "r_y0": 504.102, "r_x1": 101.532, "r_y1": 504.102, "r_x2": 101.532, "r_y2": 495.55, "r_x3": 82.165, "r_y3": 495.55, "coord_origin": "TOPLEFT"}, "text": "GTE", "orig": "GTE", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 54, "label": "text", "bbox": {"l": 134.867, "t": 495.55, "r": 153.687, "b": 504.102, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 98, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.867, "r_y0": 504.102, "r_x1": 153.687, "r_y1": 504.102, "r_x2": 153.687, "r_y2": 495.55, "r_x3": 134.867, "r_y3": 495.55, "coord_origin": "TOPLEFT"}, "text": "FTN", "orig": "FTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 55, "label": "text", "bbox": {"l": 183.624, "t": 495.55, "r": 186.942, "b": 504.102, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 99, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.624, "r_y0": 504.102, "r_x1": 186.942, "r_y1": 504.102, "r_x2": 186.942, "r_y2": 495.55, "r_x3": 183.624, "r_y3": 495.55, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 56, "label": "text", "bbox": {"l": 227.888, "t": 495.55, "r": 231.205, "b": 504.102, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 100, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 227.888, "r_y0": 504.102, "r_x1": 231.205, "r_y1": 504.102, "r_x2": 231.205, "r_y2": 495.55, "r_x3": 227.888, "r_y3": 495.55, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 57, "label": "text", "bbox": {"l": 259.699, "t": 495.55, "r": 282.114, "b": 504.102, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 101, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 259.699, "r_y0": 504.102, "r_x1": 282.114, "r_y1": 504.102, "r_x2": 282.114, "r_y2": 495.55, "r_x3": 259.699, "r_y3": 495.55, "coord_origin": "TOPLEFT"}, "text": "87.14", "orig": "87.14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 58, "label": "text", "bbox": {"l": 71.789, "t": 507.505, "r": 111.908, "b": 516.057, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 102, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 71.789, "r_y0": 516.057, "r_x1": 111.908, "r_y1": 516.057, "r_x2": 111.908, "r_y2": 507.505, "r_x3": 71.789, "r_y3": 507.505, "coord_origin": "TOPLEFT"}, "text": "GTE (FT)", "orig": "GTE (FT)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 59, "label": "text", "bbox": {"l": 134.862, "t": 507.505, "r": 153.682, "b": 516.057, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 103, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.862, "r_y0": 516.057, "r_x1": 153.682, "r_y1": 516.057, "r_x2": 153.682, "r_y2": 507.505, "r_x3": 134.862, "r_y3": 507.505, "coord_origin": "TOPLEFT"}, "text": "FTN", "orig": "FTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 60, "label": "text", "bbox": {"l": 183.629, "t": 507.505, "r": 186.947, "b": 516.057, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 104, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.629, "r_y0": 516.057, "r_x1": 186.947, "r_y1": 516.057, "r_x2": 186.947, "r_y2": 507.505, "r_x3": 183.629, "r_y3": 507.505, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 61, "label": "text", "bbox": {"l": 227.893, "t": 507.505, "r": 231.211, "b": 516.057, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 105, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 227.893, "r_y0": 516.057, "r_x1": 231.211, "r_y1": 516.057, "r_x2": 231.211, "r_y2": 507.505, "r_x3": 227.893, "r_y3": 507.505, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 62, "label": "text", "bbox": {"l": 259.694, "t": 507.505, "r": 282.109, "b": 516.057, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 106, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 259.694, "r_y0": 516.057, "r_x1": 282.109, "r_y1": 516.057, "r_x2": 282.109, "r_y2": 507.505, "r_x3": 259.694, "r_y3": 507.505, "coord_origin": "TOPLEFT"}, "text": "91.02", "orig": "91.02", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 63, "label": "text", "bbox": {"l": 66.315, "t": 519.46, "r": 117.383, "b": 528.012, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 107, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 66.315, "r_y0": 528.012, "r_x1": 117.383, "r_y1": 528.012, "r_x2": 117.383, "r_y2": 519.46, "r_x3": 66.315, "r_y3": 519.46, "coord_origin": "TOPLEFT"}, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 64, "label": "text", "bbox": {"l": 134.868, "t": 519.46, "r": 153.687, "b": 528.012, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 108, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.868, "r_y0": 528.012, "r_x1": 153.687, "r_y1": 528.012, "r_x2": 153.687, "r_y2": 519.46, "r_x3": 134.868, "r_y3": 519.46, "coord_origin": "TOPLEFT"}, "text": "FTN", "orig": "FTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 65, "label": "text", "bbox": {"l": 176.571, "t": 519.46, "r": 194.006, "b": 528.012, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 109, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 176.571, "r_y0": 528.012, "r_x1": 194.006, "r_y1": 528.012, "r_x2": 194.006, "r_y2": 519.46, "r_x3": 176.571, "r_y3": 519.46, "coord_origin": "TOPLEFT"}, "text": "97.5", "orig": "97.5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 66, "label": "text", "bbox": {"l": 220.835, "t": 519.46, "r": 238.269, "b": 528.012, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 110, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 220.835, "r_y0": 528.012, "r_x1": 238.269, "r_y1": 528.012, "r_x2": 238.269, "r_y2": 519.46, "r_x3": 220.835, "r_y3": 519.46, "coord_origin": "TOPLEFT"}, "text": "96.0", "orig": "96.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 67, "label": "text", "bbox": {"l": 262.189, "t": 519.072, "r": 279.624, "b": 528.028, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 111, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 262.189, "r_y0": 528.028, "r_x1": 279.624, "r_y1": 528.028, "r_x2": 279.624, "r_y2": 519.072, "r_x3": 262.189, "r_y3": 519.072, "coord_origin": "TOPLEFT"}, "text": "96.8", "orig": "96.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 68, "label": "text", "bbox": {"l": 81.612, "t": 536.767, "r": 102.085, "b": 545.319, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 112, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 81.612, "r_y0": 545.319, "r_x1": 102.085, "r_y1": 545.319, "r_x2": 102.085, "r_y2": 536.767, "r_x3": 81.612, "r_y3": 536.767, "coord_origin": "TOPLEFT"}, "text": "EDD", "orig": "EDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 69, "label": "text", "bbox": {"l": 137.911, "t": 536.767, "r": 150.643, "b": 545.319, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 113, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 137.911, "r_y0": 545.319, "r_x1": 150.643, "r_y1": 545.319, "r_x2": 150.643, "r_y2": 536.767, "r_x3": 137.911, "r_y3": 536.767, "coord_origin": "TOPLEFT"}, "text": "TB", "orig": "TB", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 70, "label": "text", "bbox": {"l": 176.566, "t": 536.767, "r": 194.0, "b": 545.319, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 114, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 176.566, "r_y0": 545.319, "r_x1": 194.0, "r_y1": 545.319, "r_x2": 194.0, "r_y2": 536.767, "r_x3": 176.566, "r_y3": 536.767, "coord_origin": "TOPLEFT"}, "text": "86.0", "orig": "86.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 71, "label": "text", "bbox": {"l": 227.893, "t": 536.767, "r": 231.21, "b": 545.319, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 115, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 227.893, "r_y0": 545.319, "r_x1": 231.21, "r_y1": 545.319, "r_x2": 231.21, "r_y2": 536.767, "r_x3": 227.893, "r_y3": 536.767, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 72, "label": "text", "bbox": {"l": 262.184, "t": 536.767, "r": 279.619, "b": 545.319, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 116, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 262.184, "r_y0": 545.319, "r_x1": 279.619, "r_y1": 545.319, "r_x2": 279.619, "r_y2": 536.767, "r_x3": 262.184, "r_y3": 536.767, "coord_origin": "TOPLEFT"}, "text": "86.0", "orig": "86.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 73, "label": "text", "bbox": {"l": 66.315, "t": 548.723, "r": 117.383, "b": 557.275, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 117, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 66.315, "r_y0": 557.275, "r_x1": 117.383, "r_y1": 557.275, "r_x2": 117.383, "r_y2": 548.723, "r_x3": 66.315, "r_y3": 548.723, "coord_origin": "TOPLEFT"}, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 74, "label": "text", "bbox": {"l": 137.906, "t": 548.723, "r": 150.638, "b": 557.275, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 118, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 137.906, "r_y0": 557.275, "r_x1": 150.638, "r_y1": 557.275, "r_x2": 150.638, "r_y2": 548.723, "r_x3": 137.906, "r_y3": 548.723, "coord_origin": "TOPLEFT"}, "text": "TB", "orig": "TB", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 75, "label": "text", "bbox": {"l": 176.571, "t": 548.723, "r": 194.006, "b": 557.275, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 119, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 176.571, "r_y0": 557.275, "r_x1": 194.006, "r_y1": 557.275, "r_x2": 194.006, "r_y2": 548.723, "r_x3": 176.571, "r_y3": 548.723, "coord_origin": "TOPLEFT"}, "text": "89.6", "orig": "89.6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 76, "label": "text", "bbox": {"l": 227.888, "t": 548.723, "r": 231.206, "b": 557.275, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 120, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 227.888, "r_y0": 557.275, "r_x1": 231.206, "r_y1": 557.275, "r_x2": 231.206, "r_y2": 548.723, "r_x3": 227.888, "r_y3": 548.723, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 77, "label": "text", "bbox": {"l": 262.189, "t": 548.335, "r": 279.624, "b": 557.2909999999999, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 121, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 262.189, "r_y0": 557.2909999999999, "r_x1": 279.624, "r_y1": 557.2909999999999, "r_x2": 279.624, "r_y2": 548.335, "r_x3": 262.189, "r_y3": 548.335, "coord_origin": "TOPLEFT"}, "text": "89.6", "orig": "89.6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 78, "label": "text", "bbox": {"l": 66.315, "t": 568.271, "r": 117.383, "b": 576.823, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 122, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 66.315, "r_y0": 576.823, "r_x1": 117.383, "r_y1": 576.823, "r_x2": 117.383, "r_y2": 568.271, "r_x3": 66.315, "r_y3": 568.271, "coord_origin": "TOPLEFT"}, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 79, "label": "text", "bbox": {"l": 134.868, "t": 568.271, "r": 153.687, "b": 576.823, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 123, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.868, "r_y0": 576.823, "r_x1": 153.687, "r_y1": 576.823, "r_x2": 153.687, "r_y2": 568.271, "r_x3": 134.868, "r_y3": 568.271, "coord_origin": "TOPLEFT"}, "text": "STN", "orig": "STN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 80, "label": "text", "bbox": {"l": 176.571, "t": 568.271, "r": 194.006, "b": 576.823, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 124, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 176.571, "r_y0": 576.823, "r_x1": 194.006, "r_y1": 576.823, "r_x2": 194.006, "r_y2": 568.271, "r_x3": 176.571, "r_y3": 568.271, "coord_origin": "TOPLEFT"}, "text": "96.9", "orig": "96.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 81, "label": "text", "bbox": {"l": 220.835, "t": 568.271, "r": 238.269, "b": 576.823, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 125, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 220.835, "r_y0": 576.823, "r_x1": 238.269, "r_y1": 576.823, "r_x2": 238.269, "r_y2": 568.271, "r_x3": 220.835, "r_y3": 568.271, "coord_origin": "TOPLEFT"}, "text": "95.7", "orig": "95.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 82, "label": "text", "bbox": {"l": 262.19, "t": 568.271, "r": 279.624, "b": 576.823, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 126, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 262.19, "r_y0": 576.823, "r_x1": 279.624, "r_y1": 576.823, "r_x2": 279.624, "r_y2": 568.271, "r_x3": 262.19, "r_y3": 568.271, "coord_origin": "TOPLEFT"}, "text": "96.7", "orig": "96.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}]}, {"id": 15, "label": "text", "bbox": {"l": 50.112, "t": 592.702, "r": 286.365, "b": 613.2090000000001, "coord_origin": "TOPLEFT"}, "confidence": 0.7209173440933228, "cells": [{"index": 127, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 601.254, "r_x1": 82.062, "r_y1": 601.254, "r_x2": 82.062, "r_y2": 592.702, "r_x3": 50.112, "r_y3": 592.702, "coord_origin": "TOPLEFT"}, "text": "Table 2:", "orig": "Table 2:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 128, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 87.382, "r_y0": 601.254, "r_x1": 286.365, "r_y1": 601.254, "r_x2": 286.365, "r_y2": 592.702, "r_x3": 87.382, "r_y3": 592.702, "coord_origin": "TOPLEFT"}, "text": "Structure results on PubTabNet (PTN), FinTabNet", "orig": "Structure results on PubTabNet (PTN), FinTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 129, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 613.2090000000001, "r_x1": 247.461, "r_y1": 613.2090000000001, "r_x2": 247.461, "r_y2": 604.657, "r_x3": 50.112, "r_y3": 604.657, "coord_origin": "TOPLEFT"}, "text": "(FTN), TableBank (TB) and SynthTabNet (STN).", "orig": "(FTN), TableBank (TB) and SynthTabNet (STN).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 16, "label": "text", "bbox": {"l": 50.112, "t": 616.612, "r": 261.787, "b": 625.164, "coord_origin": "TOPLEFT"}, "confidence": 0.6433312892913818, "cells": [{"index": 130, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 625.164, "r_x1": 261.787, "r_y1": 625.164, "r_x2": 261.787, "r_y2": 616.612, "r_x3": 50.112, "r_y3": 616.612, "coord_origin": "TOPLEFT"}, "text": "FT: Model was trained on PubTabNet then finetuned.", "orig": "FT: Model was trained on PubTabNet then finetuned.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 3, "label": "text", "bbox": {"l": 50.112, "t": 644.35, "r": 286.366, "b": 713.066, "coord_origin": "TOPLEFT"}, "confidence": 0.9854635000228882, "cells": [{"index": 131, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 653.306, "r_x1": 124.722, "r_y1": 653.306, "r_x2": 124.722, "r_y2": 644.35, "r_x3": 62.067, "r_y3": 644.35, "coord_origin": "TOPLEFT"}, "text": "Cell Detection.", "orig": "Cell Detection.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 132, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 128.204, "r_y0": 653.29, "r_x1": 242.933, "r_y1": 653.29, "r_x2": 242.933, "r_y2": 644.738, "r_x3": 128.204, "r_y3": 644.738, "coord_origin": "TOPLEFT"}, "text": "Like any object detector, our", "orig": "Like any object detector, our", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 133, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 245.554, "r_y0": 653.1469999999999, "r_x1": 286.361, "r_y1": 653.1469999999999, "r_x2": 286.361, "r_y2": 644.559, "r_x3": 245.554, "r_y3": 644.559, "coord_origin": "TOPLEFT"}, "text": "Cell BBox", "orig": "Cell BBox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 134, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 665.102, "r_x1": 84.971, "r_y1": 665.102, "r_x2": 84.971, "r_y2": 656.514, "r_x3": 50.112, "r_y3": 656.514, "coord_origin": "TOPLEFT"}, "text": "Detector", "orig": "Detector", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 135, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 89.515, "r_y0": 665.245, "r_x1": 123.677, "r_y1": 665.245, "r_x2": 123.677, "r_y2": 656.693, "r_x3": 89.515, "r_y3": 656.693, "coord_origin": "TOPLEFT"}, "text": "provides", "orig": "provides", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 136, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 127.991, "r_y0": 665.245, "r_x1": 286.366, "r_y1": 665.245, "r_x2": 286.366, "r_y2": 656.693, "r_x3": 127.991, "r_y3": 656.693, "coord_origin": "TOPLEFT"}, "text": "bounding boxes that can be improved", "orig": "bounding boxes that can be improved", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 137, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 677.2, "r_x1": 286.365, "r_y1": 677.2, "r_x2": 286.365, "r_y2": 668.648, "r_x3": 50.112, "r_y3": 668.648, "coord_origin": "TOPLEFT"}, "text": "with post-processing during inference. We make use of the", "orig": "with post-processing during inference. We make use of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 138, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 689.156, "r_x1": 259.655, "r_y1": 689.156, "r_x2": 259.655, "r_y2": 680.604, "r_x3": 50.112, "r_y3": 680.604, "coord_origin": "TOPLEFT"}, "text": "grid-like structure of tables to refine the predictions.", "orig": "grid-like structure of tables to refine the predictions.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 139, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 263.65, "r_y0": 689.156, "r_x1": 286.365, "r_y1": 689.156, "r_x2": 286.365, "r_y2": 680.604, "r_x3": 263.65, "r_y3": 680.604, "coord_origin": "TOPLEFT"}, "text": "A de-", "orig": "A de-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 140, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 701.111, "r_x1": 286.365, "r_y1": 701.111, "r_x2": 286.365, "r_y2": 692.559, "r_x3": 50.112, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "tailed explanation on the post-processing is available in the", "orig": "tailed explanation on the post-processing is available in the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 141, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 713.066, "r_x1": 147.068, "r_y1": 713.066, "r_x2": 147.068, "r_y2": 704.514, "r_x3": 50.112, "r_y3": 704.514, "coord_origin": "TOPLEFT"}, "text": "supplementary material.", "orig": "supplementary material.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 142, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 152.159, "r_y0": 713.066, "r_x1": 223.003, "r_y1": 713.066, "r_x2": 223.003, "r_y2": 704.514, "r_x3": 152.159, "r_y3": 704.514, "coord_origin": "TOPLEFT"}, "text": "As shown in Tab.", "orig": "As shown in Tab.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 143, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 228.094, "r_y0": 713.066, "r_x1": 286.365, "r_y1": 713.066, "r_x2": 286.365, "r_y2": 704.514, "r_x3": 228.094, "r_y3": 704.514, "coord_origin": "TOPLEFT"}, "text": "3, we evaluate", "orig": "3, we evaluate", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 7, "label": "text", "bbox": {"l": 308.862, "t": 75.298, "r": 545.115, "b": 227.49099999999999, "coord_origin": "TOPLEFT"}, "confidence": 0.9713197946548462, "cells": [{"index": 144, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 84.029, "r_x1": 322.142, "r_y1": 84.029, "r_x2": 322.142, "r_y2": 75.47699999999998, "r_x3": 308.862, "r_y3": 75.47699999999998, "coord_origin": "TOPLEFT"}, "text": "our", "orig": "our", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 145, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 325.454, "r_y0": 83.88599999999997, "r_x1": 404.567, "r_y1": 83.88599999999997, "r_x2": 404.567, "r_y2": 75.298, "r_x3": 325.454, "r_y3": 75.298, "coord_origin": "TOPLEFT"}, "text": "Cell BBox Decoder", "orig": "Cell BBox Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 146, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 408.104, "r_y0": 84.029, "r_x1": 545.11, "r_y1": 84.029, "r_x2": 545.11, "r_y2": 75.47699999999998, "r_x3": 408.104, "r_y3": 75.47699999999998, "coord_origin": "TOPLEFT"}, "text": "accuracy for cells with a class la-", "orig": "accuracy for cells with a class la-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 147, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 95.98400000000004, "r_x1": 545.115, "r_y1": 95.98400000000004, "r_x2": 545.115, "r_y2": 87.43200000000002, "r_x3": 308.862, "r_y3": 87.43200000000002, "coord_origin": "TOPLEFT"}, "text": "bel of 'content' only using the PASCAL VOC mAP metric", "orig": "bel of 'content' only using the PASCAL VOC mAP metric", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 148, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 107.93899999999996, "r_x1": 320.478, "r_y1": 107.93899999999996, "r_x2": 320.478, "r_y2": 99.38699999999994, "r_x3": 308.862, "r_y3": 99.38699999999994, "coord_origin": "TOPLEFT"}, "text": "for", "orig": "for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 149, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 324.374, "r_y0": 107.93899999999996, "r_x1": 470.226, "r_y1": 107.93899999999996, "r_x2": 470.226, "r_y2": 99.38699999999994, "r_x3": 324.374, "r_y3": 99.38699999999994, "coord_origin": "TOPLEFT"}, "text": "pre-processing and post-processing.", "orig": "pre-processing and post-processing.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 150, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 477.529, "r_y0": 107.93899999999996, "r_x1": 545.115, "r_y1": 107.93899999999996, "r_x2": 545.115, "r_y2": 99.38699999999994, "r_x3": 477.529, "r_y3": 99.38699999999994, "coord_origin": "TOPLEFT"}, "text": "Note that we do", "orig": "Note that we do", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 151, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 119.894, "r_x1": 545.115, "r_y1": 119.894, "r_x2": 545.115, "r_y2": 111.34199999999998, "r_x3": 308.862, "r_y3": 111.34199999999998, "coord_origin": "TOPLEFT"}, "text": "not have post-processing results for SynthTabNet as images", "orig": "not have post-processing results for SynthTabNet as images", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 152, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 131.84900000000005, "r_x1": 545.115, "r_y1": 131.84900000000005, "r_x2": 545.115, "r_y2": 123.29700000000003, "r_x3": 308.862, "r_y3": 123.29700000000003, "coord_origin": "TOPLEFT"}, "text": "are only provided. To compare the performance of our pro-", "orig": "are only provided. To compare the performance of our pro-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 153, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 143.80499999999995, "r_x1": 502.017, "r_y1": 143.80499999999995, "r_x2": 502.017, "r_y2": 135.25300000000004, "r_x3": 308.862, "r_y3": 135.25300000000004, "coord_origin": "TOPLEFT"}, "text": "posed approach, we've integrated TableFormer's", "orig": "posed approach, we've integrated TableFormer's", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 154, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 504.473, "r_y0": 143.66200000000003, "r_x1": 545.11, "r_y1": 143.66200000000003, "r_x2": 545.11, "r_y2": 135.07399999999996, "r_x3": 504.473, "r_y3": 135.07399999999996, "coord_origin": "TOPLEFT"}, "text": "Cell BBox", "orig": "Cell BBox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 155, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 155.61699999999996, "r_x1": 343.163, "r_y1": 155.61699999999996, "r_x2": 343.163, "r_y2": 147.029, "r_x3": 308.862, "r_y3": 147.029, "coord_origin": "TOPLEFT"}, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 156, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 346.371, "r_y0": 155.76, "r_x1": 437.818, "r_y1": 155.76, "r_x2": 437.818, "r_y2": 147.20799999999997, "r_x3": 346.371, "r_y3": 147.20799999999997, "coord_origin": "TOPLEFT"}, "text": "into EDD architecture.", "orig": "into EDD architecture.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 157, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 442.371, "r_y0": 155.76, "r_x1": 545.115, "r_y1": 155.76, "r_x2": 545.115, "r_y2": 147.20799999999997, "r_x3": 442.371, "r_y3": 147.20799999999997, "coord_origin": "TOPLEFT"}, "text": "As mentioned previously,", "orig": "As mentioned previously,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 158, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 167.71500000000003, "r_x1": 446.157, "r_y1": 167.71500000000003, "r_x2": 446.157, "r_y2": 159.163, "r_x3": 308.862, "r_y3": 159.163, "coord_origin": "TOPLEFT"}, "text": "the Structure Decoder provides the", "orig": "the Structure Decoder provides the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 159, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 448.29, "r_y0": 167.572, "r_x1": 525.042, "r_y1": 167.572, "r_x2": 525.042, "r_y2": 158.98400000000004, "r_x3": 448.29, "r_y3": 158.98400000000004, "coord_origin": "TOPLEFT"}, "text": "Cell BBox Decoder", "orig": "Cell BBox Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 160, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 527.399, "r_y0": 167.71500000000003, "r_x1": 545.113, "r_y1": 167.71500000000003, "r_x2": 545.113, "r_y2": 159.163, "r_x3": 527.399, "r_y3": 159.163, "coord_origin": "TOPLEFT"}, "text": "with", "orig": "with", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 161, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 179.66999999999996, "r_x1": 545.115, "r_y1": 179.66999999999996, "r_x2": 545.115, "r_y2": 171.11800000000005, "r_x3": 308.862, "r_y3": 171.11800000000005, "coord_origin": "TOPLEFT"}, "text": "the features needed to predict the bounding box predictions.", "orig": "the features needed to predict the bounding box predictions.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 162, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 191.625, "r_x1": 432.866, "r_y1": 191.625, "r_x2": 432.866, "r_y2": 183.07299999999998, "r_x3": 308.862, "r_y3": 183.07299999999998, "coord_origin": "TOPLEFT"}, "text": "Therefore, the accuracy of the", "orig": "Therefore, the accuracy of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 163, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 436.39, "r_y0": 191.48199999999997, "r_x1": 510.93, "r_y1": 191.48199999999997, "r_x2": 510.93, "r_y2": 182.894, "r_x3": 436.39, "r_y3": 182.894, "coord_origin": "TOPLEFT"}, "text": "Structure Decoder", "orig": "Structure Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 164, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 514.677, "r_y0": 191.625, "r_x1": 545.113, "r_y1": 191.625, "r_x2": 545.113, "r_y2": 183.07299999999998, "r_x3": 514.677, "r_y3": 183.07299999999998, "coord_origin": "TOPLEFT"}, "text": "directly", "orig": "directly", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 165, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 203.58000000000004, "r_x1": 431.173, "r_y1": 203.58000000000004, "r_x2": 431.173, "r_y2": 195.02800000000002, "r_x3": 308.862, "r_y3": 195.02800000000002, "coord_origin": "TOPLEFT"}, "text": "influences the accuracy of the", "orig": "influences the accuracy of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 166, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 434.679, "r_y0": 203.437, "r_x1": 514.181, "r_y1": 203.437, "r_x2": 514.181, "r_y2": 194.84900000000005, "r_x3": 434.679, "r_y3": 194.84900000000005, "coord_origin": "TOPLEFT"}, "text": "Cell BBox Decoder", "orig": "Cell BBox Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 167, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 514.176, "r_y0": 203.58000000000004, "r_x1": 516.667, "r_y1": 203.58000000000004, "r_x2": 516.667, "r_y2": 195.02800000000002, "r_x3": 514.176, "r_y3": 195.02800000000002, "coord_origin": "TOPLEFT"}, "text": ".", "orig": ".", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 168, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 522.794, "r_y0": 203.58000000000004, "r_x1": 529.429, "r_y1": 203.58000000000004, "r_x2": 529.429, "r_y2": 195.02800000000002, "r_x3": 522.794, "r_y3": 195.02800000000002, "coord_origin": "TOPLEFT"}, "text": "If", "orig": "If", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 169, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 532.936, "r_y0": 203.58000000000004, "r_x1": 545.11, "r_y1": 203.58000000000004, "r_x2": 545.11, "r_y2": 195.02800000000002, "r_x3": 532.936, "r_y3": 195.02800000000002, "coord_origin": "TOPLEFT"}, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 170, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 215.39300000000003, "r_x1": 382.356, "r_y1": 215.39300000000003, "r_x2": 382.356, "r_y2": 206.80499999999995, "r_x3": 308.862, "r_y3": 206.80499999999995, "coord_origin": "TOPLEFT"}, "text": "Structure Decoder", "orig": "Structure Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 171, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 385.075, "r_y0": 215.53599999999994, "r_x1": 545.114, "r_y1": 215.53599999999994, "r_x2": 545.114, "r_y2": 206.98400000000004, "r_x3": 385.075, "r_y3": 206.98400000000004, "coord_origin": "TOPLEFT"}, "text": "predicts an extra column, this will result", "orig": "predicts an extra column, this will result", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 172, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 227.49099999999999, "r_x1": 501.698, "r_y1": 227.49099999999999, "r_x2": 501.698, "r_y2": 218.93899999999996, "r_x3": 308.862, "r_y3": 218.93899999999996, "coord_origin": "TOPLEFT"}, "text": "in an extra column of predicted bounding boxes.", "orig": "in an extra column of predicted bounding boxes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 8, "label": "table", "bbox": {"l": 308.4068603515625, "t": 247.87631225585938, "r": 533.6419677734375, "b": 303.8056640625, "coord_origin": "TOPLEFT"}, "confidence": 0.9691730737686157, "cells": [{"index": 173, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 339.323, "r_y0": 262.485, "r_x1": 365.335, "r_y1": 262.485, "r_x2": 365.335, "r_y2": 253.933, "r_x3": 339.323, "r_y3": 253.933, "coord_origin": "TOPLEFT"}, "text": "Model", "orig": "Model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 174, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 401.041, "r_y0": 262.485, "r_x1": 430.919, "r_y1": 262.485, "r_x2": 430.919, "r_y2": 253.933, "r_x3": 401.041, "r_y3": 253.933, "coord_origin": "TOPLEFT"}, "text": "Dataset", "orig": "Dataset", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 175, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 454.102, "r_y0": 262.485, "r_x1": 474.585, "r_y1": 262.485, "r_x2": 474.585, "r_y2": 253.933, "r_x3": 454.102, "r_y3": 253.933, "coord_origin": "TOPLEFT"}, "text": "mAP", "orig": "mAP", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 176, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 486.54, "r_y0": 262.485, "r_x1": 527.228, "r_y1": 262.485, "r_x2": 527.228, "r_y2": 253.933, "r_x3": 486.54, "r_y3": 253.933, "coord_origin": "TOPLEFT"}, "text": "mAP (PP)", "orig": "mAP (PP)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 177, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 327.656, "r_y0": 279.442, "r_x1": 377.001, "r_y1": 279.442, "r_x2": 377.001, "r_y2": 270.89, "r_x3": 327.656, "r_y3": 270.89, "coord_origin": "TOPLEFT"}, "text": "EDD+BBox", "orig": "EDD+BBox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 178, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 393.698, "r_y0": 279.442, "r_x1": 438.281, "r_y1": 279.442, "r_x2": 438.281, "r_y2": 270.89, "r_x3": 393.698, "r_y3": 270.89, "coord_origin": "TOPLEFT"}, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 179, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 455.636, "r_y0": 279.442, "r_x1": 473.07, "r_y1": 279.442, "r_x2": 473.07, "r_y2": 270.89, "r_x3": 455.636, "r_y3": 270.89, "coord_origin": "TOPLEFT"}, "text": "79.2", "orig": "79.2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 180, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 498.166, "r_y0": 279.442, "r_x1": 515.6, "r_y1": 279.442, "r_x2": 515.6, "r_y2": 270.89, "r_x3": 498.166, "r_y3": 270.89, "coord_origin": "TOPLEFT"}, "text": "82.7", "orig": "82.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 181, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 326.795, "r_y0": 291.397, "r_x1": 377.863, "r_y1": 291.397, "r_x2": 377.863, "r_y2": 282.845, "r_x3": 326.795, "r_y3": 282.845, "coord_origin": "TOPLEFT"}, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 182, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 393.694, "r_y0": 291.397, "r_x1": 438.276, "r_y1": 291.397, "r_x2": 438.276, "r_y2": 282.845, "r_x3": 393.694, "r_y3": 282.845, "coord_origin": "TOPLEFT"}, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 183, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 455.631, "r_y0": 291.413, "r_x1": 473.066, "r_y1": 291.413, "r_x2": 473.066, "r_y2": 282.457, "r_x3": 455.631, "r_y3": 282.457, "coord_origin": "TOPLEFT"}, "text": "82.1", "orig": "82.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 184, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 498.171, "r_y0": 291.413, "r_x1": 515.606, "r_y1": 291.413, "r_x2": 515.606, "r_y2": 282.457, "r_x3": 498.171, "r_y3": 282.457, "coord_origin": "TOPLEFT"}, "text": "86.8", "orig": "86.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 185, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 326.795, "r_y0": 303.352, "r_x1": 377.863, "r_y1": 303.352, "r_x2": 377.863, "r_y2": 294.8, "r_x3": 326.795, "r_y3": 294.8, "coord_origin": "TOPLEFT"}, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 186, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 389.818, "r_y0": 303.352, "r_x1": 442.152, "r_y1": 303.352, "r_x2": 442.152, "r_y2": 294.8, "r_x3": 389.818, "r_y3": 294.8, "coord_origin": "TOPLEFT"}, "text": "SynthTabNet", "orig": "SynthTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 187, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 455.631, "r_y0": 303.352, "r_x1": 473.066, "r_y1": 303.352, "r_x2": 473.066, "r_y2": 294.8, "r_x3": 455.631, "r_y3": 294.8, "coord_origin": "TOPLEFT"}, "text": "87.7", "orig": "87.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 188, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 505.225, "r_y0": 303.352, "r_x1": 508.543, "r_y1": 303.352, "r_x2": 508.543, "r_y2": 294.8, "r_x3": 505.225, "r_y3": 294.8, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": [{"id": 83, "label": "text", "bbox": {"l": 339.323, "t": 253.933, "r": 365.335, "b": 262.485, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 173, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 339.323, "r_y0": 262.485, "r_x1": 365.335, "r_y1": 262.485, "r_x2": 365.335, "r_y2": 253.933, "r_x3": 339.323, "r_y3": 253.933, "coord_origin": "TOPLEFT"}, "text": "Model", "orig": "Model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 84, "label": "text", "bbox": {"l": 401.041, "t": 253.933, "r": 430.919, "b": 262.485, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 174, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 401.041, "r_y0": 262.485, "r_x1": 430.919, "r_y1": 262.485, "r_x2": 430.919, "r_y2": 253.933, "r_x3": 401.041, "r_y3": 253.933, "coord_origin": "TOPLEFT"}, "text": "Dataset", "orig": "Dataset", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 85, "label": "text", "bbox": {"l": 454.102, "t": 253.933, "r": 474.585, "b": 262.485, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 175, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 454.102, "r_y0": 262.485, "r_x1": 474.585, "r_y1": 262.485, "r_x2": 474.585, "r_y2": 253.933, "r_x3": 454.102, "r_y3": 253.933, "coord_origin": "TOPLEFT"}, "text": "mAP", "orig": "mAP", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 86, "label": "text", "bbox": {"l": 486.54, "t": 253.933, "r": 527.228, "b": 262.485, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 176, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 486.54, "r_y0": 262.485, "r_x1": 527.228, "r_y1": 262.485, "r_x2": 527.228, "r_y2": 253.933, "r_x3": 486.54, "r_y3": 253.933, "coord_origin": "TOPLEFT"}, "text": "mAP (PP)", "orig": "mAP (PP)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 87, "label": "text", "bbox": {"l": 327.656, "t": 270.89, "r": 377.001, "b": 279.442, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 177, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 327.656, "r_y0": 279.442, "r_x1": 377.001, "r_y1": 279.442, "r_x2": 377.001, "r_y2": 270.89, "r_x3": 327.656, "r_y3": 270.89, "coord_origin": "TOPLEFT"}, "text": "EDD+BBox", "orig": "EDD+BBox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 88, "label": "text", "bbox": {"l": 393.698, "t": 270.89, "r": 438.281, "b": 279.442, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 178, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 393.698, "r_y0": 279.442, "r_x1": 438.281, "r_y1": 279.442, "r_x2": 438.281, "r_y2": 270.89, "r_x3": 393.698, "r_y3": 270.89, "coord_origin": "TOPLEFT"}, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 89, "label": "text", "bbox": {"l": 455.636, "t": 270.89, "r": 473.07, "b": 279.442, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 179, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 455.636, "r_y0": 279.442, "r_x1": 473.07, "r_y1": 279.442, "r_x2": 473.07, "r_y2": 270.89, "r_x3": 455.636, "r_y3": 270.89, "coord_origin": "TOPLEFT"}, "text": "79.2", "orig": "79.2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 90, "label": "text", "bbox": {"l": 498.166, "t": 270.89, "r": 515.6, "b": 279.442, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 180, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 498.166, "r_y0": 279.442, "r_x1": 515.6, "r_y1": 279.442, "r_x2": 515.6, "r_y2": 270.89, "r_x3": 498.166, "r_y3": 270.89, "coord_origin": "TOPLEFT"}, "text": "82.7", "orig": "82.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 91, "label": "text", "bbox": {"l": 326.795, "t": 282.845, "r": 377.863, "b": 291.397, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 181, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 326.795, "r_y0": 291.397, "r_x1": 377.863, "r_y1": 291.397, "r_x2": 377.863, "r_y2": 282.845, "r_x3": 326.795, "r_y3": 282.845, "coord_origin": "TOPLEFT"}, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 92, "label": "text", "bbox": {"l": 393.694, "t": 282.845, "r": 438.276, "b": 291.397, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 182, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 393.694, "r_y0": 291.397, "r_x1": 438.276, "r_y1": 291.397, "r_x2": 438.276, "r_y2": 282.845, "r_x3": 393.694, "r_y3": 282.845, "coord_origin": "TOPLEFT"}, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 93, "label": "text", "bbox": {"l": 455.631, "t": 282.457, "r": 473.066, "b": 291.413, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 183, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 455.631, "r_y0": 291.413, "r_x1": 473.066, "r_y1": 291.413, "r_x2": 473.066, "r_y2": 282.457, "r_x3": 455.631, "r_y3": 282.457, "coord_origin": "TOPLEFT"}, "text": "82.1", "orig": "82.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 94, "label": "text", "bbox": {"l": 498.171, "t": 282.457, "r": 515.606, "b": 291.413, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 184, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 498.171, "r_y0": 291.413, "r_x1": 515.606, "r_y1": 291.413, "r_x2": 515.606, "r_y2": 282.457, "r_x3": 498.171, "r_y3": 282.457, "coord_origin": "TOPLEFT"}, "text": "86.8", "orig": "86.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 95, "label": "text", "bbox": {"l": 326.795, "t": 294.8, "r": 377.863, "b": 303.352, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 185, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 326.795, "r_y0": 303.352, "r_x1": 377.863, "r_y1": 303.352, "r_x2": 377.863, "r_y2": 294.8, "r_x3": 326.795, "r_y3": 294.8, "coord_origin": "TOPLEFT"}, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 96, "label": "text", "bbox": {"l": 389.818, "t": 294.8, "r": 442.152, "b": 303.352, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 186, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 389.818, "r_y0": 303.352, "r_x1": 442.152, "r_y1": 303.352, "r_x2": 442.152, "r_y2": 294.8, "r_x3": 389.818, "r_y3": 294.8, "coord_origin": "TOPLEFT"}, "text": "SynthTabNet", "orig": "SynthTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 97, "label": "text", "bbox": {"l": 455.631, "t": 294.8, "r": 473.066, "b": 303.352, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 187, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 455.631, "r_y0": 303.352, "r_x1": 473.066, "r_y1": 303.352, "r_x2": 473.066, "r_y2": 294.8, "r_x3": 455.631, "r_y3": 294.8, "coord_origin": "TOPLEFT"}, "text": "87.7", "orig": "87.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 98, "label": "text", "bbox": {"l": 505.225, "t": 294.8, "r": 508.543, "b": 303.352, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 188, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 505.225, "r_y0": 303.352, "r_x1": 508.543, "r_y1": 303.352, "r_x2": 508.543, "r_y2": 294.8, "r_x3": 505.225, "r_y3": 294.8, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}]}, {"id": 12, "label": "caption", "bbox": {"l": 308.862, "t": 316.718, "r": 545.115, "b": 337.225, "coord_origin": "TOPLEFT"}, "confidence": 0.9519917964935303, "cells": [{"index": 189, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 325.27, "r_x1": 341.499, "r_y1": 325.27, "r_x2": 341.499, "r_y2": 316.718, "r_x3": 308.862, "r_y3": 316.718, "coord_origin": "TOPLEFT"}, "text": "Table 3:", "orig": "Table 3:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 190, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 348.603, "r_y0": 325.27, "r_x1": 545.115, "r_y1": 325.27, "r_x2": 545.115, "r_y2": 316.718, "r_x3": 348.603, "r_y3": 316.718, "coord_origin": "TOPLEFT"}, "text": "Cell Bounding Box detection results on PubTab-", "orig": "Cell Bounding Box detection results on PubTab-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 191, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 337.225, "r_x1": 474.978, "r_y1": 337.225, "r_x2": 474.978, "r_y2": 328.673, "r_x3": 308.862, "r_y3": 328.673, "coord_origin": "TOPLEFT"}, "text": "Net, and FinTabNet. PP: Post-processing.", "orig": "Net, and FinTabNet. PP: Post-processing.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 4, "label": "text", "bbox": {"l": 308.862, "t": 367.68, "r": 545.116, "b": 520.082, "coord_origin": "TOPLEFT"}, "confidence": 0.9835010766983032, "cells": [{"index": 192, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 376.636, "r_x1": 378.949, "r_y1": 376.636, "r_x2": 378.949, "r_y2": 367.68, "r_x3": 320.817, "r_y3": 367.68, "coord_origin": "TOPLEFT"}, "text": "Cell Content.", "orig": "Cell Content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 193, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 387.079, "r_y0": 376.62, "r_x1": 395.378, "r_y1": 376.62, "r_x2": 395.378, "r_y2": 368.068, "r_x3": 387.079, "r_y3": 368.068, "coord_origin": "TOPLEFT"}, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 194, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 399.552, "r_y0": 376.62, "r_x1": 413.948, "r_y1": 376.62, "r_x2": 413.948, "r_y2": 368.068, "r_x3": 399.552, "r_y3": 368.068, "coord_origin": "TOPLEFT"}, "text": "this", "orig": "this", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 195, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 418.112, "r_y0": 376.62, "r_x1": 448.827, "r_y1": 376.62, "r_x2": 448.827, "r_y2": 368.068, "r_x3": 418.112, "r_y3": 368.068, "coord_origin": "TOPLEFT"}, "text": "section,", "orig": "section,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 196, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 453.42, "r_y0": 376.62, "r_x1": 545.116, "r_y1": 376.62, "r_x2": 545.116, "r_y2": 368.068, "r_x3": 453.42, "r_y3": 368.068, "coord_origin": "TOPLEFT"}, "text": "we evaluate the entire", "orig": "we evaluate the entire", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 197, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 388.575, "r_x1": 487.193, "r_y1": 388.575, "r_x2": 487.193, "r_y2": 380.023, "r_x3": 308.862, "r_y3": 380.023, "coord_origin": "TOPLEFT"}, "text": "pipeline of recovering a table with content.", "orig": "pipeline of recovering a table with content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 198, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 493.967, "r_y0": 388.575, "r_x1": 545.115, "r_y1": 388.575, "r_x2": 545.115, "r_y2": 380.023, "r_x3": 493.967, "r_y3": 380.023, "coord_origin": "TOPLEFT"}, "text": "Here we put", "orig": "Here we put", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 199, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 400.53, "r_x1": 545.115, "r_y1": 400.53, "r_x2": 545.115, "r_y2": 391.978, "r_x3": 308.862, "r_y3": 391.978, "coord_origin": "TOPLEFT"}, "text": "our approach to test by capitalizing on extracting content", "orig": "our approach to test by capitalizing on extracting content", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 200, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 412.486, "r_x1": 545.115, "r_y1": 412.486, "r_x2": 545.115, "r_y2": 403.934, "r_x3": 308.862, "r_y3": 403.934, "coord_origin": "TOPLEFT"}, "text": "from the PDF cells rather than decoding from images. Tab.", "orig": "from the PDF cells rather than decoding from images. Tab.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 201, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 424.441, "r_x1": 545.115, "r_y1": 424.441, "r_x2": 545.115, "r_y2": 415.889, "r_x3": 308.862, "r_y3": 415.889, "coord_origin": "TOPLEFT"}, "text": "4 shows the TEDs score of HTML code representing the", "orig": "4 shows the TEDs score of HTML code representing the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 202, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 436.396, "r_x1": 545.115, "r_y1": 436.396, "r_x2": 545.115, "r_y2": 427.844, "r_x3": 308.862, "r_y3": 427.844, "coord_origin": "TOPLEFT"}, "text": "structure of the table along with the content inserted in the", "orig": "structure of the table along with the content inserted in the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 203, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 448.351, "r_x1": 545.115, "r_y1": 448.351, "r_x2": 545.115, "r_y2": 439.799, "r_x3": 308.862, "r_y3": 439.799, "coord_origin": "TOPLEFT"}, "text": "data cell and compared with the ground-truth. Our method", "orig": "data cell and compared with the ground-truth. Our method", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 204, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 460.306, "r_x1": 350.237, "r_y1": 460.306, "r_x2": 350.237, "r_y2": 451.754, "r_x3": 308.862, "r_y3": 451.754, "coord_origin": "TOPLEFT"}, "text": "achieved a", "orig": "achieved a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 205, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 352.176, "r_y0": 460.322, "r_x1": 374.592, "r_y1": 460.322, "r_x2": 374.592, "r_y2": 451.366, "r_x3": 352.176, "r_y3": 451.366, "coord_origin": "TOPLEFT"}, "text": "5.3%", "orig": "5.3%", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 206, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 376.533, "r_y0": 460.306, "r_x1": 545.11, "r_y1": 460.306, "r_x2": 545.11, "r_y2": 451.754, "r_x3": 376.533, "r_y3": 451.754, "coord_origin": "TOPLEFT"}, "text": "increase over the state-of-the-art, and com-", "orig": "increase over the state-of-the-art, and com-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 207, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 472.261, "r_x1": 380.523, "r_y1": 472.261, "r_x2": 380.523, "r_y2": 463.709, "r_x3": 308.862, "r_y3": 463.709, "coord_origin": "TOPLEFT"}, "text": "mercial solutions.", "orig": "mercial solutions.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 208, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 386.042, "r_y0": 472.261, "r_x1": 545.115, "r_y1": 472.261, "r_x2": 545.115, "r_y2": 463.709, "r_x3": 386.042, "r_y3": 463.709, "coord_origin": "TOPLEFT"}, "text": "We believe our scores would be higher", "orig": "We believe our scores would be higher", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 209, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 484.217, "r_x1": 314.949, "r_y1": 484.217, "r_x2": 314.949, "r_y2": 475.665, "r_x3": 308.862, "r_y3": 475.665, "coord_origin": "TOPLEFT"}, "text": "if", "orig": "if", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 210, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 318.008, "r_y0": 484.217, "r_x1": 545.115, "r_y1": 484.217, "r_x2": 545.115, "r_y2": 475.665, "r_x3": 318.008, "r_y3": 475.665, "coord_origin": "TOPLEFT"}, "text": "the HTML ground-truth matched the extracted PDF cell", "orig": "the HTML ground-truth matched the extracted PDF cell", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 211, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 496.172, "r_x1": 340.683, "r_y1": 496.172, "r_x2": 340.683, "r_y2": 487.62, "r_x3": 308.862, "r_y3": 487.62, "coord_origin": "TOPLEFT"}, "text": "content.", "orig": "content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 212, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 345.793, "r_y0": 496.172, "r_x1": 545.115, "r_y1": 496.172, "r_x2": 545.115, "r_y2": 487.62, "r_x3": 345.793, "r_y3": 487.62, "coord_origin": "TOPLEFT"}, "text": "Unfortunately, there are small discrepancies such", "orig": "Unfortunately, there are small discrepancies such", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 213, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 508.127, "r_x1": 545.115, "r_y1": 508.127, "r_x2": 545.115, "r_y2": 499.575, "r_x3": 308.862, "r_y3": 499.575, "coord_origin": "TOPLEFT"}, "text": "as spacings around words or special characters with various", "orig": "as spacings around words or special characters with various", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 214, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 520.082, "r_x1": 405.698, "r_y1": 520.082, "r_x2": 405.698, "r_y2": 511.53, "r_x3": 308.862, "r_y3": 511.53, "coord_origin": "TOPLEFT"}, "text": "unicode representations.", "orig": "unicode representations.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 5, "label": "table", "bbox": {"l": 332.9688720703125, "t": 540.2835693359375, "r": 520.942138671875, "b": 643.2697143554688, "coord_origin": "TOPLEFT"}, "confidence": 0.9775567650794983, "cells": [{"index": 215, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 358.011, "r_y0": 561.054, "r_x1": 384.023, "r_y1": 561.054, "r_x2": 384.023, "r_y2": 552.502, "r_x3": 358.011, "r_y3": 552.502, "coord_origin": "TOPLEFT"}, "text": "Model", "orig": "Model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 216, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 449.034, "r_y0": 555.076, "r_x1": 473.94, "r_y1": 555.076, "r_x2": 473.94, "r_y2": 546.524, "r_x3": 449.034, "r_y3": 546.524, "coord_origin": "TOPLEFT"}, "text": "TEDS", "orig": "TEDS", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 217, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 408.506, "r_y0": 567.031, "r_x1": 436.74, "r_y1": 567.031, "r_x2": 436.74, "r_y2": 558.479, "r_x3": 408.506, "r_y3": 558.479, "coord_origin": "TOPLEFT"}, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 218, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 448.695, "r_y0": 567.031, "r_x1": 485.079, "r_y1": 567.031, "r_x2": 485.079, "r_y2": 558.479, "r_x3": 448.695, "r_y3": 558.479, "coord_origin": "TOPLEFT"}, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 219, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 499.385, "r_y0": 567.031, "r_x1": 512.117, "r_y1": 567.031, "r_x2": 512.117, "r_y2": 558.479, "r_x3": 499.385, "r_y3": 558.479, "coord_origin": "TOPLEFT"}, "text": "All", "orig": "All", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 220, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 357.682, "r_y0": 583.988, "r_x1": 384.352, "r_y1": 583.988, "r_x2": 384.352, "r_y2": 575.436, "r_x3": 357.682, "r_y3": 575.436, "coord_origin": "TOPLEFT"}, "text": "Tabula", "orig": "Tabula", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 221, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 413.901, "r_y0": 583.988, "r_x1": 431.336, "r_y1": 583.988, "r_x2": 431.336, "r_y2": 575.436, "r_x3": 413.901, "r_y3": 575.436, "coord_origin": "TOPLEFT"}, "text": "78.0", "orig": "78.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 222, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 458.165, "r_y0": 583.988, "r_x1": 475.599, "r_y1": 583.988, "r_x2": 475.599, "r_y2": 575.436, "r_x3": 458.165, "r_y3": 575.436, "coord_origin": "TOPLEFT"}, "text": "57.8", "orig": "57.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 223, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 497.029, "r_y0": 583.988, "r_x1": 514.463, "r_y1": 583.988, "r_x2": 514.463, "r_y2": 575.436, "r_x3": 497.029, "r_y3": 575.436, "coord_origin": "TOPLEFT"}, "text": "67.9", "orig": "67.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 224, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 350.723, "r_y0": 595.943, "r_x1": 391.311, "r_y1": 595.943, "r_x2": 391.311, "r_y2": 587.391, "r_x3": 350.723, "r_y3": 587.391, "coord_origin": "TOPLEFT"}, "text": "Traprange", "orig": "Traprange", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 225, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 413.906, "r_y0": 595.943, "r_x1": 431.34, "r_y1": 595.943, "r_x2": 431.34, "r_y2": 587.391, "r_x3": 413.906, "r_y3": 587.391, "coord_origin": "TOPLEFT"}, "text": "60.8", "orig": "60.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 226, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 458.17, "r_y0": 595.943, "r_x1": 475.604, "r_y1": 595.943, "r_x2": 475.604, "r_y2": 587.391, "r_x3": 458.17, "r_y3": 587.391, "coord_origin": "TOPLEFT"}, "text": "49.9", "orig": "49.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 227, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 497.034, "r_y0": 595.943, "r_x1": 514.468, "r_y1": 595.943, "r_x2": 514.468, "r_y2": 587.391, "r_x3": 497.034, "r_y3": 587.391, "coord_origin": "TOPLEFT"}, "text": "55.4", "orig": "55.4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 228, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 354.136, "r_y0": 607.899, "r_x1": 387.899, "r_y1": 607.899, "r_x2": 387.899, "r_y2": 599.347, "r_x3": 354.136, "r_y3": 599.347, "coord_origin": "TOPLEFT"}, "text": "Camelot", "orig": "Camelot", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 229, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 413.902, "r_y0": 607.899, "r_x1": 431.336, "r_y1": 607.899, "r_x2": 431.336, "r_y2": 599.347, "r_x3": 413.902, "r_y3": 599.347, "coord_origin": "TOPLEFT"}, "text": "80.0", "orig": "80.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 230, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 458.165, "r_y0": 607.899, "r_x1": 475.6, "r_y1": 607.899, "r_x2": 475.6, "r_y2": 599.347, "r_x3": 458.165, "r_y3": 599.347, "coord_origin": "TOPLEFT"}, "text": "66.0", "orig": "66.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 231, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 497.03, "r_y0": 607.899, "r_x1": 514.464, "r_y1": 607.899, "r_x2": 514.464, "r_y2": 599.347, "r_x3": 497.03, "r_y3": 599.347, "coord_origin": "TOPLEFT"}, "text": "73.0", "orig": "73.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 232, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 346.559, "r_y0": 619.854, "r_x1": 395.475, "r_y1": 619.854, "r_x2": 395.475, "r_y2": 611.302, "r_x3": 346.559, "r_y3": 611.302, "coord_origin": "TOPLEFT"}, "text": "Acrobat Pro", "orig": "Acrobat Pro", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 233, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 413.906, "r_y0": 619.854, "r_x1": 431.341, "r_y1": 619.854, "r_x2": 431.341, "r_y2": 611.302, "r_x3": 413.906, "r_y3": 611.302, "coord_origin": "TOPLEFT"}, "text": "68.9", "orig": "68.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 234, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 458.17, "r_y0": 619.854, "r_x1": 475.605, "r_y1": 619.854, "r_x2": 475.605, "r_y2": 611.302, "r_x3": 458.17, "r_y3": 611.302, "coord_origin": "TOPLEFT"}, "text": "61.8", "orig": "61.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 235, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 497.034, "r_y0": 619.854, "r_x1": 514.469, "r_y1": 619.854, "r_x2": 514.469, "r_y2": 611.302, "r_x3": 497.034, "r_y3": 611.302, "coord_origin": "TOPLEFT"}, "text": "65.3", "orig": "65.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 236, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 360.781, "r_y0": 631.809, "r_x1": 381.254, "r_y1": 631.809, "r_x2": 381.254, "r_y2": 623.2570000000001, "r_x3": 360.781, "r_y3": 623.2570000000001, "coord_origin": "TOPLEFT"}, "text": "EDD", "orig": "EDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 237, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 413.902, "r_y0": 631.809, "r_x1": 431.336, "r_y1": 631.809, "r_x2": 431.336, "r_y2": 623.2570000000001, "r_x3": 413.902, "r_y3": 623.2570000000001, "coord_origin": "TOPLEFT"}, "text": "91.2", "orig": "91.2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 238, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 458.165, "r_y0": 631.809, "r_x1": 475.6, "r_y1": 631.809, "r_x2": 475.6, "r_y2": 623.2570000000001, "r_x3": 458.165, "r_y3": 623.2570000000001, "coord_origin": "TOPLEFT"}, "text": "85.4", "orig": "85.4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 239, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 497.03, "r_y0": 631.809, "r_x1": 514.464, "r_y1": 631.809, "r_x2": 514.464, "r_y2": 623.2570000000001, "r_x3": 497.03, "r_y3": 623.2570000000001, "coord_origin": "TOPLEFT"}, "text": "88.3", "orig": "88.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 240, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 345.483, "r_y0": 643.764, "r_x1": 396.551, "r_y1": 643.764, "r_x2": 396.551, "r_y2": 635.212, "r_x3": 345.483, "r_y3": 635.212, "coord_origin": "TOPLEFT"}, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 241, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 413.906, "r_y0": 643.764, "r_x1": 431.341, "r_y1": 643.764, "r_x2": 431.341, "r_y2": 635.212, "r_x3": 413.906, "r_y3": 635.212, "coord_origin": "TOPLEFT"}, "text": "95.4", "orig": "95.4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 242, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 458.17, "r_y0": 643.764, "r_x1": 475.605, "r_y1": 643.764, "r_x2": 475.605, "r_y2": 635.212, "r_x3": 458.17, "r_y3": 635.212, "coord_origin": "TOPLEFT"}, "text": "90.1", "orig": "90.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 243, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 497.034, "r_y0": 643.78, "r_x1": 514.469, "r_y1": 643.78, "r_x2": 514.469, "r_y2": 634.8240000000001, "r_x3": 497.034, "r_y3": 634.8240000000001, "coord_origin": "TOPLEFT"}, "text": "93.6", "orig": "93.6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": [{"id": 99, "label": "text", "bbox": {"l": 358.011, "t": 552.502, "r": 384.023, "b": 561.054, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 215, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 358.011, "r_y0": 561.054, "r_x1": 384.023, "r_y1": 561.054, "r_x2": 384.023, "r_y2": 552.502, "r_x3": 358.011, "r_y3": 552.502, "coord_origin": "TOPLEFT"}, "text": "Model", "orig": "Model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 100, "label": "text", "bbox": {"l": 449.034, "t": 546.524, "r": 473.94, "b": 555.076, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 216, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 449.034, "r_y0": 555.076, "r_x1": 473.94, "r_y1": 555.076, "r_x2": 473.94, "r_y2": 546.524, "r_x3": 449.034, "r_y3": 546.524, "coord_origin": "TOPLEFT"}, "text": "TEDS", "orig": "TEDS", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 101, "label": "text", "bbox": {"l": 408.506, "t": 558.479, "r": 436.74, "b": 567.031, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 217, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 408.506, "r_y0": 567.031, "r_x1": 436.74, "r_y1": 567.031, "r_x2": 436.74, "r_y2": 558.479, "r_x3": 408.506, "r_y3": 558.479, "coord_origin": "TOPLEFT"}, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 102, "label": "text", "bbox": {"l": 448.695, "t": 558.479, "r": 485.079, "b": 567.031, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 218, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 448.695, "r_y0": 567.031, "r_x1": 485.079, "r_y1": 567.031, "r_x2": 485.079, "r_y2": 558.479, "r_x3": 448.695, "r_y3": 558.479, "coord_origin": "TOPLEFT"}, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 103, "label": "text", "bbox": {"l": 499.385, "t": 558.479, "r": 512.117, "b": 567.031, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 219, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 499.385, "r_y0": 567.031, "r_x1": 512.117, "r_y1": 567.031, "r_x2": 512.117, "r_y2": 558.479, "r_x3": 499.385, "r_y3": 558.479, "coord_origin": "TOPLEFT"}, "text": "All", "orig": "All", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 104, "label": "text", "bbox": {"l": 357.682, "t": 575.436, "r": 384.352, "b": 583.988, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 220, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 357.682, "r_y0": 583.988, "r_x1": 384.352, "r_y1": 583.988, "r_x2": 384.352, "r_y2": 575.436, "r_x3": 357.682, "r_y3": 575.436, "coord_origin": "TOPLEFT"}, "text": "Tabula", "orig": "Tabula", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 105, "label": "text", "bbox": {"l": 413.901, "t": 575.436, "r": 431.336, "b": 583.988, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 221, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 413.901, "r_y0": 583.988, "r_x1": 431.336, "r_y1": 583.988, "r_x2": 431.336, "r_y2": 575.436, "r_x3": 413.901, "r_y3": 575.436, "coord_origin": "TOPLEFT"}, "text": "78.0", "orig": "78.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 106, "label": "text", "bbox": {"l": 458.165, "t": 575.436, "r": 475.599, "b": 583.988, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 222, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 458.165, "r_y0": 583.988, "r_x1": 475.599, "r_y1": 583.988, "r_x2": 475.599, "r_y2": 575.436, "r_x3": 458.165, "r_y3": 575.436, "coord_origin": "TOPLEFT"}, "text": "57.8", "orig": "57.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 107, "label": "text", "bbox": {"l": 497.029, "t": 575.436, "r": 514.463, "b": 583.988, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 223, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 497.029, "r_y0": 583.988, "r_x1": 514.463, "r_y1": 583.988, "r_x2": 514.463, "r_y2": 575.436, "r_x3": 497.029, "r_y3": 575.436, "coord_origin": "TOPLEFT"}, "text": "67.9", "orig": "67.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 108, "label": "text", "bbox": {"l": 350.723, "t": 587.391, "r": 391.311, "b": 595.943, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 224, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 350.723, "r_y0": 595.943, "r_x1": 391.311, "r_y1": 595.943, "r_x2": 391.311, "r_y2": 587.391, "r_x3": 350.723, "r_y3": 587.391, "coord_origin": "TOPLEFT"}, "text": "Traprange", "orig": "Traprange", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 109, "label": "text", "bbox": {"l": 413.906, "t": 587.391, "r": 431.34, "b": 595.943, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 225, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 413.906, "r_y0": 595.943, "r_x1": 431.34, "r_y1": 595.943, "r_x2": 431.34, "r_y2": 587.391, "r_x3": 413.906, "r_y3": 587.391, "coord_origin": "TOPLEFT"}, "text": "60.8", "orig": "60.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 110, "label": "text", "bbox": {"l": 458.17, "t": 587.391, "r": 475.604, "b": 595.943, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 226, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 458.17, "r_y0": 595.943, "r_x1": 475.604, "r_y1": 595.943, "r_x2": 475.604, "r_y2": 587.391, "r_x3": 458.17, "r_y3": 587.391, "coord_origin": "TOPLEFT"}, "text": "49.9", "orig": "49.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 111, "label": "text", "bbox": {"l": 497.034, "t": 587.391, "r": 514.468, "b": 595.943, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 227, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 497.034, "r_y0": 595.943, "r_x1": 514.468, "r_y1": 595.943, "r_x2": 514.468, "r_y2": 587.391, "r_x3": 497.034, "r_y3": 587.391, "coord_origin": "TOPLEFT"}, "text": "55.4", "orig": "55.4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 112, "label": "text", "bbox": {"l": 354.136, "t": 599.347, "r": 387.899, "b": 607.899, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 228, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 354.136, "r_y0": 607.899, "r_x1": 387.899, "r_y1": 607.899, "r_x2": 387.899, "r_y2": 599.347, "r_x3": 354.136, "r_y3": 599.347, "coord_origin": "TOPLEFT"}, "text": "Camelot", "orig": "Camelot", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 113, "label": "text", "bbox": {"l": 413.902, "t": 599.347, "r": 431.336, "b": 607.899, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 229, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 413.902, "r_y0": 607.899, "r_x1": 431.336, "r_y1": 607.899, "r_x2": 431.336, "r_y2": 599.347, "r_x3": 413.902, "r_y3": 599.347, "coord_origin": "TOPLEFT"}, "text": "80.0", "orig": "80.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 114, "label": "text", "bbox": {"l": 458.165, "t": 599.347, "r": 475.6, "b": 607.899, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 230, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 458.165, "r_y0": 607.899, "r_x1": 475.6, "r_y1": 607.899, "r_x2": 475.6, "r_y2": 599.347, "r_x3": 458.165, "r_y3": 599.347, "coord_origin": "TOPLEFT"}, "text": "66.0", "orig": "66.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 115, "label": "text", "bbox": {"l": 497.03, "t": 599.347, "r": 514.464, "b": 607.899, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 231, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 497.03, "r_y0": 607.899, "r_x1": 514.464, "r_y1": 607.899, "r_x2": 514.464, "r_y2": 599.347, "r_x3": 497.03, "r_y3": 599.347, "coord_origin": "TOPLEFT"}, "text": "73.0", "orig": "73.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 116, "label": "text", "bbox": {"l": 346.559, "t": 611.302, "r": 395.475, "b": 619.854, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 232, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 346.559, "r_y0": 619.854, "r_x1": 395.475, "r_y1": 619.854, "r_x2": 395.475, "r_y2": 611.302, "r_x3": 346.559, "r_y3": 611.302, "coord_origin": "TOPLEFT"}, "text": "Acrobat Pro", "orig": "Acrobat Pro", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 117, "label": "text", "bbox": {"l": 413.906, "t": 611.302, "r": 431.341, "b": 619.854, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 233, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 413.906, "r_y0": 619.854, "r_x1": 431.341, "r_y1": 619.854, "r_x2": 431.341, "r_y2": 611.302, "r_x3": 413.906, "r_y3": 611.302, "coord_origin": "TOPLEFT"}, "text": "68.9", "orig": "68.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 118, "label": "text", "bbox": {"l": 458.17, "t": 611.302, "r": 475.605, "b": 619.854, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 234, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 458.17, "r_y0": 619.854, "r_x1": 475.605, "r_y1": 619.854, "r_x2": 475.605, "r_y2": 611.302, "r_x3": 458.17, "r_y3": 611.302, "coord_origin": "TOPLEFT"}, "text": "61.8", "orig": "61.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 119, "label": "text", "bbox": {"l": 497.034, "t": 611.302, "r": 514.469, "b": 619.854, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 235, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 497.034, "r_y0": 619.854, "r_x1": 514.469, "r_y1": 619.854, "r_x2": 514.469, "r_y2": 611.302, "r_x3": 497.034, "r_y3": 611.302, "coord_origin": "TOPLEFT"}, "text": "65.3", "orig": "65.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 120, "label": "text", "bbox": {"l": 360.781, "t": 623.2570000000001, "r": 381.254, "b": 631.809, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 236, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 360.781, "r_y0": 631.809, "r_x1": 381.254, "r_y1": 631.809, "r_x2": 381.254, "r_y2": 623.2570000000001, "r_x3": 360.781, "r_y3": 623.2570000000001, "coord_origin": "TOPLEFT"}, "text": "EDD", "orig": "EDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 121, "label": "text", "bbox": {"l": 413.902, "t": 623.2570000000001, "r": 431.336, "b": 631.809, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 237, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 413.902, "r_y0": 631.809, "r_x1": 431.336, "r_y1": 631.809, "r_x2": 431.336, "r_y2": 623.2570000000001, "r_x3": 413.902, "r_y3": 623.2570000000001, "coord_origin": "TOPLEFT"}, "text": "91.2", "orig": "91.2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 122, "label": "text", "bbox": {"l": 458.165, "t": 623.2570000000001, "r": 475.6, "b": 631.809, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 238, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 458.165, "r_y0": 631.809, "r_x1": 475.6, "r_y1": 631.809, "r_x2": 475.6, "r_y2": 623.2570000000001, "r_x3": 458.165, "r_y3": 623.2570000000001, "coord_origin": "TOPLEFT"}, "text": "85.4", "orig": "85.4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 123, "label": "text", "bbox": {"l": 497.03, "t": 623.2570000000001, "r": 514.464, "b": 631.809, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 239, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 497.03, "r_y0": 631.809, "r_x1": 514.464, "r_y1": 631.809, "r_x2": 514.464, "r_y2": 623.2570000000001, "r_x3": 497.03, "r_y3": 623.2570000000001, "coord_origin": "TOPLEFT"}, "text": "88.3", "orig": "88.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 124, "label": "text", "bbox": {"l": 345.483, "t": 635.212, "r": 396.551, "b": 643.764, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 240, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 345.483, "r_y0": 643.764, "r_x1": 396.551, "r_y1": 643.764, "r_x2": 396.551, "r_y2": 635.212, "r_x3": 345.483, "r_y3": 635.212, "coord_origin": "TOPLEFT"}, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 125, "label": "text", "bbox": {"l": 413.906, "t": 635.212, "r": 431.341, "b": 643.764, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 241, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 413.906, "r_y0": 643.764, "r_x1": 431.341, "r_y1": 643.764, "r_x2": 431.341, "r_y2": 635.212, "r_x3": 413.906, "r_y3": 635.212, "coord_origin": "TOPLEFT"}, "text": "95.4", "orig": "95.4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 126, "label": "text", "bbox": {"l": 458.17, "t": 635.212, "r": 475.605, "b": 643.764, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 242, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 458.17, "r_y0": 643.764, "r_x1": 475.605, "r_y1": 643.764, "r_x2": 475.605, "r_y2": 635.212, "r_x3": 458.17, "r_y3": 635.212, "coord_origin": "TOPLEFT"}, "text": "90.1", "orig": "90.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 127, "label": "text", "bbox": {"l": 497.034, "t": 634.8240000000001, "r": 514.469, "b": 643.78, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 243, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 497.034, "r_y0": 643.78, "r_x1": 514.469, "r_y1": 643.78, "r_x2": 514.469, "r_y2": 634.8240000000001, "r_x3": 497.034, "r_y3": 634.8240000000001, "coord_origin": "TOPLEFT"}, "text": "93.6", "orig": "93.6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}]}, {"id": 11, "label": "caption", "bbox": {"l": 308.862, "t": 657.13, "r": 545.115, "b": 689.592, "coord_origin": "TOPLEFT"}, "confidence": 0.9541404247283936, "cells": [{"index": 244, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 665.682, "r_x1": 341.739, "r_y1": 665.682, "r_x2": 341.739, "r_y2": 657.13, "r_x3": 308.862, "r_y3": 657.13, "coord_origin": "TOPLEFT"}, "text": "Table 4:", "orig": "Table 4:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 245, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 349.559, "r_y0": 665.682, "r_x1": 545.115, "r_y1": 665.682, "r_x2": 545.115, "r_y2": 657.13, "r_x3": 349.559, "r_y3": 657.13, "coord_origin": "TOPLEFT"}, "text": "Results of structure with content retrieved using", "orig": "Results of structure with content retrieved using", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 246, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 677.637, "r_x1": 425.763, "r_y1": 677.637, "r_x2": 425.763, "r_y2": 669.085, "r_x3": 308.862, "r_y3": 669.085, "coord_origin": "TOPLEFT"}, "text": "cell detection on PubTabNet.", "orig": "cell detection on PubTabNet.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 247, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 430.336, "r_y0": 677.637, "r_x1": 545.115, "r_y1": 677.637, "r_x2": 545.115, "r_y2": 669.085, "r_x3": 430.336, "r_y3": 669.085, "coord_origin": "TOPLEFT"}, "text": "In all cases the input is PDF", "orig": "In all cases the input is PDF", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 248, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 689.592, "r_x1": 435.038, "r_y1": 689.592, "r_x2": 435.038, "r_y2": 681.04, "r_x3": 308.862, "r_y3": 681.04, "coord_origin": "TOPLEFT"}, "text": "documents with cropped tables.", "orig": "documents with cropped tables.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 14, "label": "page_footer", "bbox": {"l": 295.121, "t": 734.402, "r": 300.102, "b": 742.954, "coord_origin": "TOPLEFT"}, "confidence": 0.8787972331047058, "cells": [{"index": 249, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 295.121, "r_y0": 742.954, "r_x1": 300.102, "r_y1": 742.954, "r_x2": 300.102, "r_y2": 734.402, "r_x3": 295.121, "r_y3": 734.402, "coord_origin": "TOPLEFT"}, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}]}, "tablestructure": {"table_map": {"0": {"label": "table", "id": 0, "page_no": 6, "cluster": {"id": 0, "label": "table", "bbox": {"l": 53.368526458740234, "t": 409.1357727050781, "r": 283.0443420410156, "b": 582.3977661132812, "coord_origin": "TOPLEFT"}, "confidence": 0.9892510175704956, "cells": [{"index": 71, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 78.843, "r_y0": 429.511, "r_x1": 104.855, "r_y1": 429.511, "r_x2": 104.855, "r_y2": 420.959, "r_x3": 78.843, "r_y3": 420.959, "coord_origin": "TOPLEFT"}, "text": "Model", "orig": "Model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 72, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 211.2, "r_y0": 423.533, "r_x1": 236.107, "r_y1": 423.533, "r_x2": 236.107, "r_y2": 414.981, "r_x3": 211.2, "r_y3": 414.981, "coord_origin": "TOPLEFT"}, "text": "TEDS", "orig": "TEDS", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 73, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 129.338, "r_y0": 435.488, "r_x1": 159.216, "r_y1": 435.488, "r_x2": 159.216, "r_y2": 426.936, "r_x3": 129.338, "r_y3": 426.936, "coord_origin": "TOPLEFT"}, "text": "Dataset", "orig": "Dataset", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 74, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 171.171, "r_y0": 435.488, "r_x1": 199.405, "r_y1": 435.488, "r_x2": 199.405, "r_y2": 426.936, "r_x3": 171.171, "r_y3": 426.936, "coord_origin": "TOPLEFT"}, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 75, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 211.36, "r_y0": 435.488, "r_x1": 247.744, "r_y1": 435.488, "r_x2": 247.744, "r_y2": 426.936, "r_x3": 211.36, "r_y3": 426.936, "coord_origin": "TOPLEFT"}, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 76, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 264.54, "r_y0": 435.488, "r_x1": 277.273, "r_y1": 435.488, "r_x2": 277.273, "r_y2": 426.936, "r_x3": 264.54, "r_y3": 426.936, "coord_origin": "TOPLEFT"}, "text": "All", "orig": "All", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 77, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 81.612, "r_y0": 452.445, "r_x1": 102.085, "r_y1": 452.445, "r_x2": 102.085, "r_y2": 443.893, "r_x3": 81.612, "r_y3": 443.893, "coord_origin": "TOPLEFT"}, "text": "EDD", "orig": "EDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 78, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.872, "r_y0": 452.445, "r_x1": 153.691, "r_y1": 452.445, "r_x2": 153.691, "r_y2": 443.893, "r_x3": 134.872, "r_y3": 443.893, "coord_origin": "TOPLEFT"}, "text": "PTN", "orig": "PTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 79, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 176.566, "r_y0": 452.445, "r_x1": 194.0, "r_y1": 452.445, "r_x2": 194.0, "r_y2": 443.893, "r_x3": 176.566, "r_y3": 443.893, "coord_origin": "TOPLEFT"}, "text": "91.1", "orig": "91.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 80, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 220.829, "r_y0": 452.445, "r_x1": 238.264, "r_y1": 452.445, "r_x2": 238.264, "r_y2": 443.893, "r_x3": 220.829, "r_y3": 443.893, "coord_origin": "TOPLEFT"}, "text": "88.7", "orig": "88.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 81, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 262.184, "r_y0": 452.445, "r_x1": 279.619, "r_y1": 452.445, "r_x2": 279.619, "r_y2": 443.893, "r_x3": 262.184, "r_y3": 443.893, "coord_origin": "TOPLEFT"}, "text": "89.9", "orig": "89.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 82, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 82.165, "r_y0": 464.401, "r_x1": 101.532, "r_y1": 464.401, "r_x2": 101.532, "r_y2": 455.849, "r_x3": 82.165, "r_y3": 455.849, "coord_origin": "TOPLEFT"}, "text": "GTE", "orig": "GTE", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 83, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.867, "r_y0": 464.401, "r_x1": 153.687, "r_y1": 464.401, "r_x2": 153.687, "r_y2": 455.849, "r_x3": 134.867, "r_y3": 455.849, "coord_origin": "TOPLEFT"}, "text": "PTN", "orig": "PTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 84, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.624, "r_y0": 464.401, "r_x1": 186.942, "r_y1": 464.401, "r_x2": 186.942, "r_y2": 455.849, "r_x3": 183.624, "r_y3": 455.849, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 85, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 227.888, "r_y0": 464.401, "r_x1": 231.205, "r_y1": 464.401, "r_x2": 231.205, "r_y2": 455.849, "r_x3": 227.888, "r_y3": 455.849, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 86, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 259.699, "r_y0": 464.401, "r_x1": 282.114, "r_y1": 464.401, "r_x2": 282.114, "r_y2": 455.849, "r_x3": 259.699, "r_y3": 455.849, "coord_origin": "TOPLEFT"}, "text": "93.01", "orig": "93.01", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 87, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 66.315, "r_y0": 476.954, "r_x1": 117.383, "r_y1": 476.954, "r_x2": 117.383, "r_y2": 468.402, "r_x3": 66.315, "r_y3": 468.402, "coord_origin": "TOPLEFT"}, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 88, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.868, "r_y0": 476.954, "r_x1": 153.687, "r_y1": 476.954, "r_x2": 153.687, "r_y2": 468.402, "r_x3": 134.868, "r_y3": 468.402, "coord_origin": "TOPLEFT"}, "text": "PTN", "orig": "PTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 89, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 176.571, "r_y0": 476.954, "r_x1": 194.006, "r_y1": 476.954, "r_x2": 194.006, "r_y2": 468.402, "r_x3": 176.571, "r_y3": 468.402, "coord_origin": "TOPLEFT"}, "text": "98.5", "orig": "98.5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 90, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 220.835, "r_y0": 476.954, "r_x1": 238.269, "r_y1": 476.954, "r_x2": 238.269, "r_y2": 468.402, "r_x3": 220.835, "r_y3": 468.402, "coord_origin": "TOPLEFT"}, "text": "95.0", "orig": "95.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 91, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 259.698, "r_y0": 476.97, "r_x1": 282.114, "r_y1": 476.97, "r_x2": 282.114, "r_y2": 468.014, "r_x3": 259.698, "r_y3": 468.014, "coord_origin": "TOPLEFT"}, "text": "96.75", "orig": "96.75", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 92, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 81.612, "r_y0": 492.147, "r_x1": 102.085, "r_y1": 492.147, "r_x2": 102.085, "r_y2": 483.595, "r_x3": 81.612, "r_y3": 483.595, "coord_origin": "TOPLEFT"}, "text": "EDD", "orig": "EDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 93, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.872, "r_y0": 492.147, "r_x1": 153.691, "r_y1": 492.147, "r_x2": 153.691, "r_y2": 483.595, "r_x3": 134.872, "r_y3": 483.595, "coord_origin": "TOPLEFT"}, "text": "FTN", "orig": "FTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 94, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 176.566, "r_y0": 492.147, "r_x1": 194.0, "r_y1": 492.147, "r_x2": 194.0, "r_y2": 483.595, "r_x3": 176.566, "r_y3": 483.595, "coord_origin": "TOPLEFT"}, "text": "88.4", "orig": "88.4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 95, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 218.339, "r_y0": 492.147, "r_x1": 240.755, "r_y1": 492.147, "r_x2": 240.755, "r_y2": 483.595, "r_x3": 218.339, "r_y3": 483.595, "coord_origin": "TOPLEFT"}, "text": "92.08", "orig": "92.08", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 96, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 262.184, "r_y0": 492.147, "r_x1": 279.619, "r_y1": 492.147, "r_x2": 279.619, "r_y2": 483.595, "r_x3": 262.184, "r_y3": 483.595, "coord_origin": "TOPLEFT"}, "text": "90.6", "orig": "90.6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 97, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 82.165, "r_y0": 504.102, "r_x1": 101.532, "r_y1": 504.102, "r_x2": 101.532, "r_y2": 495.55, "r_x3": 82.165, "r_y3": 495.55, "coord_origin": "TOPLEFT"}, "text": "GTE", "orig": "GTE", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 98, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.867, "r_y0": 504.102, "r_x1": 153.687, "r_y1": 504.102, "r_x2": 153.687, "r_y2": 495.55, "r_x3": 134.867, "r_y3": 495.55, "coord_origin": "TOPLEFT"}, "text": "FTN", "orig": "FTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 99, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.624, "r_y0": 504.102, "r_x1": 186.942, "r_y1": 504.102, "r_x2": 186.942, "r_y2": 495.55, "r_x3": 183.624, "r_y3": 495.55, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 100, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 227.888, "r_y0": 504.102, "r_x1": 231.205, "r_y1": 504.102, "r_x2": 231.205, "r_y2": 495.55, "r_x3": 227.888, "r_y3": 495.55, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 101, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 259.699, "r_y0": 504.102, "r_x1": 282.114, "r_y1": 504.102, "r_x2": 282.114, "r_y2": 495.55, "r_x3": 259.699, "r_y3": 495.55, "coord_origin": "TOPLEFT"}, "text": "87.14", "orig": "87.14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 102, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 71.789, "r_y0": 516.057, "r_x1": 111.908, "r_y1": 516.057, "r_x2": 111.908, "r_y2": 507.505, "r_x3": 71.789, "r_y3": 507.505, "coord_origin": "TOPLEFT"}, "text": "GTE (FT)", "orig": "GTE (FT)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 103, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.862, "r_y0": 516.057, "r_x1": 153.682, "r_y1": 516.057, "r_x2": 153.682, "r_y2": 507.505, "r_x3": 134.862, "r_y3": 507.505, "coord_origin": "TOPLEFT"}, "text": "FTN", "orig": "FTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 104, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.629, "r_y0": 516.057, "r_x1": 186.947, "r_y1": 516.057, "r_x2": 186.947, "r_y2": 507.505, "r_x3": 183.629, "r_y3": 507.505, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 105, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 227.893, "r_y0": 516.057, "r_x1": 231.211, "r_y1": 516.057, "r_x2": 231.211, "r_y2": 507.505, "r_x3": 227.893, "r_y3": 507.505, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 106, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 259.694, "r_y0": 516.057, "r_x1": 282.109, "r_y1": 516.057, "r_x2": 282.109, "r_y2": 507.505, "r_x3": 259.694, "r_y3": 507.505, "coord_origin": "TOPLEFT"}, "text": "91.02", "orig": "91.02", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 107, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 66.315, "r_y0": 528.012, "r_x1": 117.383, "r_y1": 528.012, "r_x2": 117.383, "r_y2": 519.46, "r_x3": 66.315, "r_y3": 519.46, "coord_origin": "TOPLEFT"}, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 108, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.868, "r_y0": 528.012, "r_x1": 153.687, "r_y1": 528.012, "r_x2": 153.687, "r_y2": 519.46, "r_x3": 134.868, "r_y3": 519.46, "coord_origin": "TOPLEFT"}, "text": "FTN", "orig": "FTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 109, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 176.571, "r_y0": 528.012, "r_x1": 194.006, "r_y1": 528.012, "r_x2": 194.006, "r_y2": 519.46, "r_x3": 176.571, "r_y3": 519.46, "coord_origin": "TOPLEFT"}, "text": "97.5", "orig": "97.5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 110, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 220.835, "r_y0": 528.012, "r_x1": 238.269, "r_y1": 528.012, "r_x2": 238.269, "r_y2": 519.46, "r_x3": 220.835, "r_y3": 519.46, "coord_origin": "TOPLEFT"}, "text": "96.0", "orig": "96.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 111, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 262.189, "r_y0": 528.028, "r_x1": 279.624, "r_y1": 528.028, "r_x2": 279.624, "r_y2": 519.072, "r_x3": 262.189, "r_y3": 519.072, "coord_origin": "TOPLEFT"}, "text": "96.8", "orig": "96.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 112, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 81.612, "r_y0": 545.319, "r_x1": 102.085, "r_y1": 545.319, "r_x2": 102.085, "r_y2": 536.767, "r_x3": 81.612, "r_y3": 536.767, "coord_origin": "TOPLEFT"}, "text": "EDD", "orig": "EDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 113, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 137.911, "r_y0": 545.319, "r_x1": 150.643, "r_y1": 545.319, "r_x2": 150.643, "r_y2": 536.767, "r_x3": 137.911, "r_y3": 536.767, "coord_origin": "TOPLEFT"}, "text": "TB", "orig": "TB", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 114, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 176.566, "r_y0": 545.319, "r_x1": 194.0, "r_y1": 545.319, "r_x2": 194.0, "r_y2": 536.767, "r_x3": 176.566, "r_y3": 536.767, "coord_origin": "TOPLEFT"}, "text": "86.0", "orig": "86.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 115, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 227.893, "r_y0": 545.319, "r_x1": 231.21, "r_y1": 545.319, "r_x2": 231.21, "r_y2": 536.767, "r_x3": 227.893, "r_y3": 536.767, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 116, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 262.184, "r_y0": 545.319, "r_x1": 279.619, "r_y1": 545.319, "r_x2": 279.619, "r_y2": 536.767, "r_x3": 262.184, "r_y3": 536.767, "coord_origin": "TOPLEFT"}, "text": "86.0", "orig": "86.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 117, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 66.315, "r_y0": 557.275, "r_x1": 117.383, "r_y1": 557.275, "r_x2": 117.383, "r_y2": 548.723, "r_x3": 66.315, "r_y3": 548.723, "coord_origin": "TOPLEFT"}, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 118, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 137.906, "r_y0": 557.275, "r_x1": 150.638, "r_y1": 557.275, "r_x2": 150.638, "r_y2": 548.723, "r_x3": 137.906, "r_y3": 548.723, "coord_origin": "TOPLEFT"}, "text": "TB", "orig": "TB", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 119, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 176.571, "r_y0": 557.275, "r_x1": 194.006, "r_y1": 557.275, "r_x2": 194.006, "r_y2": 548.723, "r_x3": 176.571, "r_y3": 548.723, "coord_origin": "TOPLEFT"}, "text": "89.6", "orig": "89.6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 120, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 227.888, "r_y0": 557.275, "r_x1": 231.206, "r_y1": 557.275, "r_x2": 231.206, "r_y2": 548.723, "r_x3": 227.888, "r_y3": 548.723, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 121, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 262.189, "r_y0": 557.2909999999999, "r_x1": 279.624, "r_y1": 557.2909999999999, "r_x2": 279.624, "r_y2": 548.335, "r_x3": 262.189, "r_y3": 548.335, "coord_origin": "TOPLEFT"}, "text": "89.6", "orig": "89.6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 122, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 66.315, "r_y0": 576.823, "r_x1": 117.383, "r_y1": 576.823, "r_x2": 117.383, "r_y2": 568.271, "r_x3": 66.315, "r_y3": 568.271, "coord_origin": "TOPLEFT"}, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 123, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.868, "r_y0": 576.823, "r_x1": 153.687, "r_y1": 576.823, "r_x2": 153.687, "r_y2": 568.271, "r_x3": 134.868, "r_y3": 568.271, "coord_origin": "TOPLEFT"}, "text": "STN", "orig": "STN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 124, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 176.571, "r_y0": 576.823, "r_x1": 194.006, "r_y1": 576.823, "r_x2": 194.006, "r_y2": 568.271, "r_x3": 176.571, "r_y3": 568.271, "coord_origin": "TOPLEFT"}, "text": "96.9", "orig": "96.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 125, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 220.835, "r_y0": 576.823, "r_x1": 238.269, "r_y1": 576.823, "r_x2": 238.269, "r_y2": 568.271, "r_x3": 220.835, "r_y3": 568.271, "coord_origin": "TOPLEFT"}, "text": "95.7", "orig": "95.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 126, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 262.19, "r_y0": 576.823, "r_x1": 279.624, "r_y1": 576.823, "r_x2": 279.624, "r_y2": 568.271, "r_x3": 262.19, "r_y3": 568.271, "coord_origin": "TOPLEFT"}, "text": "96.7", "orig": "96.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": [{"id": 27, "label": "text", "bbox": {"l": 78.843, "t": 420.959, "r": 104.855, "b": 429.511, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 71, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 78.843, "r_y0": 429.511, "r_x1": 104.855, "r_y1": 429.511, "r_x2": 104.855, "r_y2": 420.959, "r_x3": 78.843, "r_y3": 420.959, "coord_origin": "TOPLEFT"}, "text": "Model", "orig": "Model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 28, "label": "text", "bbox": {"l": 211.2, "t": 414.981, "r": 236.107, "b": 423.533, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 72, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 211.2, "r_y0": 423.533, "r_x1": 236.107, "r_y1": 423.533, "r_x2": 236.107, "r_y2": 414.981, "r_x3": 211.2, "r_y3": 414.981, "coord_origin": "TOPLEFT"}, "text": "TEDS", "orig": "TEDS", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 29, "label": "text", "bbox": {"l": 129.338, "t": 426.936, "r": 159.216, "b": 435.488, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 73, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 129.338, "r_y0": 435.488, "r_x1": 159.216, "r_y1": 435.488, "r_x2": 159.216, "r_y2": 426.936, "r_x3": 129.338, "r_y3": 426.936, "coord_origin": "TOPLEFT"}, "text": "Dataset", "orig": "Dataset", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 30, "label": "text", "bbox": {"l": 171.171, "t": 426.936, "r": 199.405, "b": 435.488, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 74, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 171.171, "r_y0": 435.488, "r_x1": 199.405, "r_y1": 435.488, "r_x2": 199.405, "r_y2": 426.936, "r_x3": 171.171, "r_y3": 426.936, "coord_origin": "TOPLEFT"}, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 31, "label": "text", "bbox": {"l": 211.36, "t": 426.936, "r": 247.744, "b": 435.488, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 75, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 211.36, "r_y0": 435.488, "r_x1": 247.744, "r_y1": 435.488, "r_x2": 247.744, "r_y2": 426.936, "r_x3": 211.36, "r_y3": 426.936, "coord_origin": "TOPLEFT"}, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 32, "label": "text", "bbox": {"l": 264.54, "t": 426.936, "r": 277.273, "b": 435.488, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 76, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 264.54, "r_y0": 435.488, "r_x1": 277.273, "r_y1": 435.488, "r_x2": 277.273, "r_y2": 426.936, "r_x3": 264.54, "r_y3": 426.936, "coord_origin": "TOPLEFT"}, "text": "All", "orig": "All", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 33, "label": "text", "bbox": {"l": 81.612, "t": 443.893, "r": 102.085, "b": 452.445, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 77, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 81.612, "r_y0": 452.445, "r_x1": 102.085, "r_y1": 452.445, "r_x2": 102.085, "r_y2": 443.893, "r_x3": 81.612, "r_y3": 443.893, "coord_origin": "TOPLEFT"}, "text": "EDD", "orig": "EDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 34, "label": "text", "bbox": {"l": 134.872, "t": 443.893, "r": 153.691, "b": 452.445, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 78, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.872, "r_y0": 452.445, "r_x1": 153.691, "r_y1": 452.445, "r_x2": 153.691, "r_y2": 443.893, "r_x3": 134.872, "r_y3": 443.893, "coord_origin": "TOPLEFT"}, "text": "PTN", "orig": "PTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 35, "label": "text", "bbox": {"l": 176.566, "t": 443.893, "r": 194.0, "b": 452.445, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 79, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 176.566, "r_y0": 452.445, "r_x1": 194.0, "r_y1": 452.445, "r_x2": 194.0, "r_y2": 443.893, "r_x3": 176.566, "r_y3": 443.893, "coord_origin": "TOPLEFT"}, "text": "91.1", "orig": "91.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 36, "label": "text", "bbox": {"l": 220.829, "t": 443.893, "r": 238.264, "b": 452.445, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 80, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 220.829, "r_y0": 452.445, "r_x1": 238.264, "r_y1": 452.445, "r_x2": 238.264, "r_y2": 443.893, "r_x3": 220.829, "r_y3": 443.893, "coord_origin": "TOPLEFT"}, "text": "88.7", "orig": "88.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 37, "label": "text", "bbox": {"l": 262.184, "t": 443.893, "r": 279.619, "b": 452.445, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 81, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 262.184, "r_y0": 452.445, "r_x1": 279.619, "r_y1": 452.445, "r_x2": 279.619, "r_y2": 443.893, "r_x3": 262.184, "r_y3": 443.893, "coord_origin": "TOPLEFT"}, "text": "89.9", "orig": "89.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 38, "label": "text", "bbox": {"l": 82.165, "t": 455.849, "r": 101.532, "b": 464.401, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 82, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 82.165, "r_y0": 464.401, "r_x1": 101.532, "r_y1": 464.401, "r_x2": 101.532, "r_y2": 455.849, "r_x3": 82.165, "r_y3": 455.849, "coord_origin": "TOPLEFT"}, "text": "GTE", "orig": "GTE", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 39, "label": "text", "bbox": {"l": 134.867, "t": 455.849, "r": 153.687, "b": 464.401, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 83, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.867, "r_y0": 464.401, "r_x1": 153.687, "r_y1": 464.401, "r_x2": 153.687, "r_y2": 455.849, "r_x3": 134.867, "r_y3": 455.849, "coord_origin": "TOPLEFT"}, "text": "PTN", "orig": "PTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 40, "label": "text", "bbox": {"l": 183.624, "t": 455.849, "r": 186.942, "b": 464.401, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 84, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.624, "r_y0": 464.401, "r_x1": 186.942, "r_y1": 464.401, "r_x2": 186.942, "r_y2": 455.849, "r_x3": 183.624, "r_y3": 455.849, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 41, "label": "text", "bbox": {"l": 227.888, "t": 455.849, "r": 231.205, "b": 464.401, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 85, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 227.888, "r_y0": 464.401, "r_x1": 231.205, "r_y1": 464.401, "r_x2": 231.205, "r_y2": 455.849, "r_x3": 227.888, "r_y3": 455.849, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 42, "label": "text", "bbox": {"l": 259.699, "t": 455.849, "r": 282.114, "b": 464.401, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 86, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 259.699, "r_y0": 464.401, "r_x1": 282.114, "r_y1": 464.401, "r_x2": 282.114, "r_y2": 455.849, "r_x3": 259.699, "r_y3": 455.849, "coord_origin": "TOPLEFT"}, "text": "93.01", "orig": "93.01", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 43, "label": "text", "bbox": {"l": 66.315, "t": 468.402, "r": 117.383, "b": 476.954, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 87, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 66.315, "r_y0": 476.954, "r_x1": 117.383, "r_y1": 476.954, "r_x2": 117.383, "r_y2": 468.402, "r_x3": 66.315, "r_y3": 468.402, "coord_origin": "TOPLEFT"}, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 44, "label": "text", "bbox": {"l": 134.868, "t": 468.402, "r": 153.687, "b": 476.954, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 88, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.868, "r_y0": 476.954, "r_x1": 153.687, "r_y1": 476.954, "r_x2": 153.687, "r_y2": 468.402, "r_x3": 134.868, "r_y3": 468.402, "coord_origin": "TOPLEFT"}, "text": "PTN", "orig": "PTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 45, "label": "text", "bbox": {"l": 176.571, "t": 468.402, "r": 194.006, "b": 476.954, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 89, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 176.571, "r_y0": 476.954, "r_x1": 194.006, "r_y1": 476.954, "r_x2": 194.006, "r_y2": 468.402, "r_x3": 176.571, "r_y3": 468.402, "coord_origin": "TOPLEFT"}, "text": "98.5", "orig": "98.5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 46, "label": "text", "bbox": {"l": 220.835, "t": 468.402, "r": 238.269, "b": 476.954, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 90, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 220.835, "r_y0": 476.954, "r_x1": 238.269, "r_y1": 476.954, "r_x2": 238.269, "r_y2": 468.402, "r_x3": 220.835, "r_y3": 468.402, "coord_origin": "TOPLEFT"}, "text": "95.0", "orig": "95.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 47, "label": "text", "bbox": {"l": 259.698, "t": 468.014, "r": 282.114, "b": 476.97, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 91, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 259.698, "r_y0": 476.97, "r_x1": 282.114, "r_y1": 476.97, "r_x2": 282.114, "r_y2": 468.014, "r_x3": 259.698, "r_y3": 468.014, "coord_origin": "TOPLEFT"}, "text": "96.75", "orig": "96.75", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 48, "label": "text", "bbox": {"l": 81.612, "t": 483.595, "r": 102.085, "b": 492.147, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 92, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 81.612, "r_y0": 492.147, "r_x1": 102.085, "r_y1": 492.147, "r_x2": 102.085, "r_y2": 483.595, "r_x3": 81.612, "r_y3": 483.595, "coord_origin": "TOPLEFT"}, "text": "EDD", "orig": "EDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 49, "label": "text", "bbox": {"l": 134.872, "t": 483.595, "r": 153.691, "b": 492.147, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 93, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.872, "r_y0": 492.147, "r_x1": 153.691, "r_y1": 492.147, "r_x2": 153.691, "r_y2": 483.595, "r_x3": 134.872, "r_y3": 483.595, "coord_origin": "TOPLEFT"}, "text": "FTN", "orig": "FTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 50, "label": "text", "bbox": {"l": 176.566, "t": 483.595, "r": 194.0, "b": 492.147, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 94, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 176.566, "r_y0": 492.147, "r_x1": 194.0, "r_y1": 492.147, "r_x2": 194.0, "r_y2": 483.595, "r_x3": 176.566, "r_y3": 483.595, "coord_origin": "TOPLEFT"}, "text": "88.4", "orig": "88.4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 51, "label": "text", "bbox": {"l": 218.339, "t": 483.595, "r": 240.755, "b": 492.147, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 95, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 218.339, "r_y0": 492.147, "r_x1": 240.755, "r_y1": 492.147, "r_x2": 240.755, "r_y2": 483.595, "r_x3": 218.339, "r_y3": 483.595, "coord_origin": "TOPLEFT"}, "text": "92.08", "orig": "92.08", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 52, "label": "text", "bbox": {"l": 262.184, "t": 483.595, "r": 279.619, "b": 492.147, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 96, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 262.184, "r_y0": 492.147, "r_x1": 279.619, "r_y1": 492.147, "r_x2": 279.619, "r_y2": 483.595, "r_x3": 262.184, "r_y3": 483.595, "coord_origin": "TOPLEFT"}, "text": "90.6", "orig": "90.6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 53, "label": "text", "bbox": {"l": 82.165, "t": 495.55, "r": 101.532, "b": 504.102, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 97, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 82.165, "r_y0": 504.102, "r_x1": 101.532, "r_y1": 504.102, "r_x2": 101.532, "r_y2": 495.55, "r_x3": 82.165, "r_y3": 495.55, "coord_origin": "TOPLEFT"}, "text": "GTE", "orig": "GTE", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 54, "label": "text", "bbox": {"l": 134.867, "t": 495.55, "r": 153.687, "b": 504.102, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 98, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.867, "r_y0": 504.102, "r_x1": 153.687, "r_y1": 504.102, "r_x2": 153.687, "r_y2": 495.55, "r_x3": 134.867, "r_y3": 495.55, "coord_origin": "TOPLEFT"}, "text": "FTN", "orig": "FTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 55, "label": "text", "bbox": {"l": 183.624, "t": 495.55, "r": 186.942, "b": 504.102, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 99, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.624, "r_y0": 504.102, "r_x1": 186.942, "r_y1": 504.102, "r_x2": 186.942, "r_y2": 495.55, "r_x3": 183.624, "r_y3": 495.55, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 56, "label": "text", "bbox": {"l": 227.888, "t": 495.55, "r": 231.205, "b": 504.102, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 100, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 227.888, "r_y0": 504.102, "r_x1": 231.205, "r_y1": 504.102, "r_x2": 231.205, "r_y2": 495.55, "r_x3": 227.888, "r_y3": 495.55, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 57, "label": "text", "bbox": {"l": 259.699, "t": 495.55, "r": 282.114, "b": 504.102, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 101, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 259.699, "r_y0": 504.102, "r_x1": 282.114, "r_y1": 504.102, "r_x2": 282.114, "r_y2": 495.55, "r_x3": 259.699, "r_y3": 495.55, "coord_origin": "TOPLEFT"}, "text": "87.14", "orig": "87.14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 58, "label": "text", "bbox": {"l": 71.789, "t": 507.505, "r": 111.908, "b": 516.057, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 102, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 71.789, "r_y0": 516.057, "r_x1": 111.908, "r_y1": 516.057, "r_x2": 111.908, "r_y2": 507.505, "r_x3": 71.789, "r_y3": 507.505, "coord_origin": "TOPLEFT"}, "text": "GTE (FT)", "orig": "GTE (FT)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 59, "label": "text", "bbox": {"l": 134.862, "t": 507.505, "r": 153.682, "b": 516.057, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 103, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.862, "r_y0": 516.057, "r_x1": 153.682, "r_y1": 516.057, "r_x2": 153.682, "r_y2": 507.505, "r_x3": 134.862, "r_y3": 507.505, "coord_origin": "TOPLEFT"}, "text": "FTN", "orig": "FTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 60, "label": "text", "bbox": {"l": 183.629, "t": 507.505, "r": 186.947, "b": 516.057, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 104, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.629, "r_y0": 516.057, "r_x1": 186.947, "r_y1": 516.057, "r_x2": 186.947, "r_y2": 507.505, "r_x3": 183.629, "r_y3": 507.505, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 61, "label": "text", "bbox": {"l": 227.893, "t": 507.505, "r": 231.211, "b": 516.057, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 105, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 227.893, "r_y0": 516.057, "r_x1": 231.211, "r_y1": 516.057, "r_x2": 231.211, "r_y2": 507.505, "r_x3": 227.893, "r_y3": 507.505, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 62, "label": "text", "bbox": {"l": 259.694, "t": 507.505, "r": 282.109, "b": 516.057, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 106, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 259.694, "r_y0": 516.057, "r_x1": 282.109, "r_y1": 516.057, "r_x2": 282.109, "r_y2": 507.505, "r_x3": 259.694, "r_y3": 507.505, "coord_origin": "TOPLEFT"}, "text": "91.02", "orig": "91.02", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 63, "label": "text", "bbox": {"l": 66.315, "t": 519.46, "r": 117.383, "b": 528.012, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 107, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 66.315, "r_y0": 528.012, "r_x1": 117.383, "r_y1": 528.012, "r_x2": 117.383, "r_y2": 519.46, "r_x3": 66.315, "r_y3": 519.46, "coord_origin": "TOPLEFT"}, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 64, "label": "text", "bbox": {"l": 134.868, "t": 519.46, "r": 153.687, "b": 528.012, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 108, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.868, "r_y0": 528.012, "r_x1": 153.687, "r_y1": 528.012, "r_x2": 153.687, "r_y2": 519.46, "r_x3": 134.868, "r_y3": 519.46, "coord_origin": "TOPLEFT"}, "text": "FTN", "orig": "FTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 65, "label": "text", "bbox": {"l": 176.571, "t": 519.46, "r": 194.006, "b": 528.012, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 109, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 176.571, "r_y0": 528.012, "r_x1": 194.006, "r_y1": 528.012, "r_x2": 194.006, "r_y2": 519.46, "r_x3": 176.571, "r_y3": 519.46, "coord_origin": "TOPLEFT"}, "text": "97.5", "orig": "97.5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 66, "label": "text", "bbox": {"l": 220.835, "t": 519.46, "r": 238.269, "b": 528.012, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 110, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 220.835, "r_y0": 528.012, "r_x1": 238.269, "r_y1": 528.012, "r_x2": 238.269, "r_y2": 519.46, "r_x3": 220.835, "r_y3": 519.46, "coord_origin": "TOPLEFT"}, "text": "96.0", "orig": "96.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 67, "label": "text", "bbox": {"l": 262.189, "t": 519.072, "r": 279.624, "b": 528.028, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 111, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 262.189, "r_y0": 528.028, "r_x1": 279.624, "r_y1": 528.028, "r_x2": 279.624, "r_y2": 519.072, "r_x3": 262.189, "r_y3": 519.072, "coord_origin": "TOPLEFT"}, "text": "96.8", "orig": "96.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 68, "label": "text", "bbox": {"l": 81.612, "t": 536.767, "r": 102.085, "b": 545.319, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 112, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 81.612, "r_y0": 545.319, "r_x1": 102.085, "r_y1": 545.319, "r_x2": 102.085, "r_y2": 536.767, "r_x3": 81.612, "r_y3": 536.767, "coord_origin": "TOPLEFT"}, "text": "EDD", "orig": "EDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 69, "label": "text", "bbox": {"l": 137.911, "t": 536.767, "r": 150.643, "b": 545.319, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 113, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 137.911, "r_y0": 545.319, "r_x1": 150.643, "r_y1": 545.319, "r_x2": 150.643, "r_y2": 536.767, "r_x3": 137.911, "r_y3": 536.767, "coord_origin": "TOPLEFT"}, "text": "TB", "orig": "TB", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 70, "label": "text", "bbox": {"l": 176.566, "t": 536.767, "r": 194.0, "b": 545.319, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 114, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 176.566, "r_y0": 545.319, "r_x1": 194.0, "r_y1": 545.319, "r_x2": 194.0, "r_y2": 536.767, "r_x3": 176.566, "r_y3": 536.767, "coord_origin": "TOPLEFT"}, "text": "86.0", "orig": "86.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 71, "label": "text", "bbox": {"l": 227.893, "t": 536.767, "r": 231.21, "b": 545.319, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 115, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 227.893, "r_y0": 545.319, "r_x1": 231.21, "r_y1": 545.319, "r_x2": 231.21, "r_y2": 536.767, "r_x3": 227.893, "r_y3": 536.767, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 72, "label": "text", "bbox": {"l": 262.184, "t": 536.767, "r": 279.619, "b": 545.319, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 116, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 262.184, "r_y0": 545.319, "r_x1": 279.619, "r_y1": 545.319, "r_x2": 279.619, "r_y2": 536.767, "r_x3": 262.184, "r_y3": 536.767, "coord_origin": "TOPLEFT"}, "text": "86.0", "orig": "86.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 73, "label": "text", "bbox": {"l": 66.315, "t": 548.723, "r": 117.383, "b": 557.275, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 117, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 66.315, "r_y0": 557.275, "r_x1": 117.383, "r_y1": 557.275, "r_x2": 117.383, "r_y2": 548.723, "r_x3": 66.315, "r_y3": 548.723, "coord_origin": "TOPLEFT"}, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 74, "label": "text", "bbox": {"l": 137.906, "t": 548.723, "r": 150.638, "b": 557.275, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 118, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 137.906, "r_y0": 557.275, "r_x1": 150.638, "r_y1": 557.275, "r_x2": 150.638, "r_y2": 548.723, "r_x3": 137.906, "r_y3": 548.723, "coord_origin": "TOPLEFT"}, "text": "TB", "orig": "TB", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 75, "label": "text", "bbox": {"l": 176.571, "t": 548.723, "r": 194.006, "b": 557.275, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 119, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 176.571, "r_y0": 557.275, "r_x1": 194.006, "r_y1": 557.275, "r_x2": 194.006, "r_y2": 548.723, "r_x3": 176.571, "r_y3": 548.723, "coord_origin": "TOPLEFT"}, "text": "89.6", "orig": "89.6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 76, "label": "text", "bbox": {"l": 227.888, "t": 548.723, "r": 231.206, "b": 557.275, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 120, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 227.888, "r_y0": 557.275, "r_x1": 231.206, "r_y1": 557.275, "r_x2": 231.206, "r_y2": 548.723, "r_x3": 227.888, "r_y3": 548.723, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 77, "label": "text", "bbox": {"l": 262.189, "t": 548.335, "r": 279.624, "b": 557.2909999999999, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 121, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 262.189, "r_y0": 557.2909999999999, "r_x1": 279.624, "r_y1": 557.2909999999999, "r_x2": 279.624, "r_y2": 548.335, "r_x3": 262.189, "r_y3": 548.335, "coord_origin": "TOPLEFT"}, "text": "89.6", "orig": "89.6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 78, "label": "text", "bbox": {"l": 66.315, "t": 568.271, "r": 117.383, "b": 576.823, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 122, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 66.315, "r_y0": 576.823, "r_x1": 117.383, "r_y1": 576.823, "r_x2": 117.383, "r_y2": 568.271, "r_x3": 66.315, "r_y3": 568.271, "coord_origin": "TOPLEFT"}, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 79, "label": "text", "bbox": {"l": 134.868, "t": 568.271, "r": 153.687, "b": 576.823, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 123, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.868, "r_y0": 576.823, "r_x1": 153.687, "r_y1": 576.823, "r_x2": 153.687, "r_y2": 568.271, "r_x3": 134.868, "r_y3": 568.271, "coord_origin": "TOPLEFT"}, "text": "STN", "orig": "STN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 80, "label": "text", "bbox": {"l": 176.571, "t": 568.271, "r": 194.006, "b": 576.823, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 124, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 176.571, "r_y0": 576.823, "r_x1": 194.006, "r_y1": 576.823, "r_x2": 194.006, "r_y2": 568.271, "r_x3": 176.571, "r_y3": 568.271, "coord_origin": "TOPLEFT"}, "text": "96.9", "orig": "96.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 81, "label": "text", "bbox": {"l": 220.835, "t": 568.271, "r": 238.269, "b": 576.823, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 125, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 220.835, "r_y0": 576.823, "r_x1": 238.269, "r_y1": 576.823, "r_x2": 238.269, "r_y2": 568.271, "r_x3": 220.835, "r_y3": 568.271, "coord_origin": "TOPLEFT"}, "text": "95.7", "orig": "95.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 82, "label": "text", "bbox": {"l": 262.19, "t": 568.271, "r": 279.624, "b": 576.823, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 126, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 262.19, "r_y0": 576.823, "r_x1": 279.624, "r_y1": 576.823, "r_x2": 279.624, "r_y2": 568.271, "r_x3": 262.19, "r_y3": 568.271, "coord_origin": "TOPLEFT"}, "text": "96.7", "orig": "96.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}]}, "text": null, "otsl_seq": ["ched", "ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 11, "num_cols": 5, "table_cells": [{"bbox": {"l": 78.843, "t": 420.959, "r": 104.855, "b": 429.511, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Model", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 211.2, "t": 414.981, "r": 247.744, "b": 435.488, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "TEDS Complex", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 129.338, "t": 426.936, "r": 159.216, "b": 435.488, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "Dataset", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 171.171, "t": 426.936, "r": 199.405, "b": 435.488, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "Simple", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 264.54, "t": 426.936, "r": 277.273, "b": 435.488, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "All", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 81.612, "t": 443.893, "r": 102.085, "b": 452.445, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "EDD", "column_header": false, "row_header": true, "row_section": false}, {"bbox": {"l": 134.872, "t": 443.893, "r": 153.691, "b": 452.445, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "PTN", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 176.566, "t": 443.893, "r": 194.0, "b": 452.445, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "91.1", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 220.829, "t": 443.893, "r": 238.264, "b": 452.445, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "88.7", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 262.184, "t": 443.893, "r": 279.619, "b": 452.445, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "89.9", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 82.165, "t": 455.849, "r": 101.532, "b": 464.401, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "GTE", "column_header": false, "row_header": true, "row_section": false}, {"bbox": {"l": 134.867, "t": 455.849, "r": 153.687, "b": 464.401, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "PTN", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 183.624, "t": 455.849, "r": 186.942, "b": 464.401, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "-", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 227.888, "t": 455.849, "r": 231.205, "b": 464.401, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "-", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 259.699, "t": 455.849, "r": 282.114, "b": 464.401, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "93.01", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 66.315, "t": 468.402, "r": 117.383, "b": 476.954, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "TableFormer", "column_header": false, "row_header": true, "row_section": false}, {"bbox": {"l": 134.868, "t": 468.402, "r": 153.687, "b": 476.954, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "PTN", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 176.571, "t": 468.402, "r": 194.006, "b": 476.954, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "98.5", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 220.835, "t": 468.402, "r": 238.269, "b": 476.954, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "95.0", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 259.698, "t": 468.014, "r": 282.114, "b": 476.97, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "96.75", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 81.612, "t": 483.595, "r": 102.085, "b": 492.147, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "EDD", "column_header": false, "row_header": true, "row_section": false}, {"bbox": {"l": 134.872, "t": 483.595, "r": 153.691, "b": 492.147, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "FTN", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 176.566, "t": 483.595, "r": 194.0, "b": 492.147, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "88.4", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 218.339, "t": 483.595, "r": 240.755, "b": 492.147, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "92.08", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 262.184, "t": 483.595, "r": 279.619, "b": 492.147, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "90.6", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 82.165, "t": 495.55, "r": 101.532, "b": 504.102, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "GTE", "column_header": false, "row_header": true, "row_section": false}, {"bbox": {"l": 134.867, "t": 495.55, "r": 153.687, "b": 504.102, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "FTN", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 183.624, "t": 495.55, "r": 186.942, "b": 504.102, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "-", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 227.888, "t": 495.55, "r": 231.205, "b": 504.102, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "-", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 259.699, "t": 495.55, "r": 282.114, "b": 504.102, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "87.14", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 71.789, "t": 507.505, "r": 111.908, "b": 516.057, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "GTE (FT)", "column_header": false, "row_header": true, "row_section": false}, {"bbox": {"l": 134.862, "t": 507.505, "r": 153.682, "b": 516.057, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "FTN", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 183.629, "t": 507.505, "r": 186.947, "b": 516.057, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "-", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 227.893, "t": 507.505, "r": 231.211, "b": 516.057, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "-", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 259.694, "t": 507.505, "r": 282.109, "b": 516.057, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "91.02", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 66.315, "t": 519.46, "r": 117.383, "b": 528.012, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 7, "end_row_offset_idx": 8, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "TableFormer", "column_header": false, "row_header": true, "row_section": false}, {"bbox": {"l": 134.868, "t": 519.46, "r": 153.687, "b": 528.012, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 7, "end_row_offset_idx": 8, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "FTN", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 176.571, "t": 519.46, "r": 194.006, "b": 528.012, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 7, "end_row_offset_idx": 8, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "97.5", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 220.835, "t": 519.46, "r": 238.269, "b": 528.012, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 7, "end_row_offset_idx": 8, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "96.0", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 262.189, "t": 519.072, "r": 279.624, "b": 528.028, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 7, "end_row_offset_idx": 8, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "96.8", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 81.612, "t": 536.767, "r": 102.085, "b": 545.319, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 8, "end_row_offset_idx": 9, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "EDD", "column_header": false, "row_header": true, "row_section": false}, {"bbox": {"l": 137.911, "t": 536.767, "r": 150.643, "b": 545.319, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 8, "end_row_offset_idx": 9, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "TB", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 176.566, "t": 536.767, "r": 194.0, "b": 545.319, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 8, "end_row_offset_idx": 9, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "86.0", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 227.893, "t": 536.767, "r": 231.21, "b": 545.319, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 8, "end_row_offset_idx": 9, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "-", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 262.184, "t": 536.767, "r": 279.619, "b": 545.319, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 8, "end_row_offset_idx": 9, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "86.0", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 66.315, "t": 548.723, "r": 117.383, "b": 557.275, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 9, "end_row_offset_idx": 10, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "TableFormer", "column_header": false, "row_header": true, "row_section": false}, {"bbox": {"l": 137.906, "t": 548.723, "r": 150.638, "b": 557.275, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 9, "end_row_offset_idx": 10, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "TB", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 176.571, "t": 548.723, "r": 194.006, "b": 557.275, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 9, "end_row_offset_idx": 10, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "89.6", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 227.888, "t": 548.723, "r": 231.206, "b": 557.275, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 9, "end_row_offset_idx": 10, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "-", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 262.189, "t": 548.335, "r": 279.624, "b": 557.2909999999999, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 9, "end_row_offset_idx": 10, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "89.6", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 66.315, "t": 568.271, "r": 117.383, "b": 576.823, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 10, "end_row_offset_idx": 11, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "TableFormer", "column_header": false, "row_header": true, "row_section": false}, {"bbox": {"l": 134.868, "t": 568.271, "r": 153.687, "b": 576.823, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 10, "end_row_offset_idx": 11, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "STN", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 176.571, "t": 568.271, "r": 194.006, "b": 576.823, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 10, "end_row_offset_idx": 11, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "96.9", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 220.835, "t": 568.271, "r": 238.269, "b": 576.823, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 10, "end_row_offset_idx": 11, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "95.7", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 262.19, "t": 568.271, "r": 279.624, "b": 576.823, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 10, "end_row_offset_idx": 11, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "96.7", "column_header": false, "row_header": false, "row_section": false}]}, "8": {"label": "table", "id": 8, "page_no": 6, "cluster": {"id": 8, "label": "table", "bbox": {"l": 308.4068603515625, "t": 247.87631225585938, "r": 533.6419677734375, "b": 303.8056640625, "coord_origin": "TOPLEFT"}, "confidence": 0.9691730737686157, "cells": [{"index": 173, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 339.323, "r_y0": 262.485, "r_x1": 365.335, "r_y1": 262.485, "r_x2": 365.335, "r_y2": 253.933, "r_x3": 339.323, "r_y3": 253.933, "coord_origin": "TOPLEFT"}, "text": "Model", "orig": "Model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 174, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 401.041, "r_y0": 262.485, "r_x1": 430.919, "r_y1": 262.485, "r_x2": 430.919, "r_y2": 253.933, "r_x3": 401.041, "r_y3": 253.933, "coord_origin": "TOPLEFT"}, "text": "Dataset", "orig": "Dataset", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 175, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 454.102, "r_y0": 262.485, "r_x1": 474.585, "r_y1": 262.485, "r_x2": 474.585, "r_y2": 253.933, "r_x3": 454.102, "r_y3": 253.933, "coord_origin": "TOPLEFT"}, "text": "mAP", "orig": "mAP", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 176, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 486.54, "r_y0": 262.485, "r_x1": 527.228, "r_y1": 262.485, "r_x2": 527.228, "r_y2": 253.933, "r_x3": 486.54, "r_y3": 253.933, "coord_origin": "TOPLEFT"}, "text": "mAP (PP)", "orig": "mAP (PP)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 177, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 327.656, "r_y0": 279.442, "r_x1": 377.001, "r_y1": 279.442, "r_x2": 377.001, "r_y2": 270.89, "r_x3": 327.656, "r_y3": 270.89, "coord_origin": "TOPLEFT"}, "text": "EDD+BBox", "orig": "EDD+BBox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 178, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 393.698, "r_y0": 279.442, "r_x1": 438.281, "r_y1": 279.442, "r_x2": 438.281, "r_y2": 270.89, "r_x3": 393.698, "r_y3": 270.89, "coord_origin": "TOPLEFT"}, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 179, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 455.636, "r_y0": 279.442, "r_x1": 473.07, "r_y1": 279.442, "r_x2": 473.07, "r_y2": 270.89, "r_x3": 455.636, "r_y3": 270.89, "coord_origin": "TOPLEFT"}, "text": "79.2", "orig": "79.2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 180, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 498.166, "r_y0": 279.442, "r_x1": 515.6, "r_y1": 279.442, "r_x2": 515.6, "r_y2": 270.89, "r_x3": 498.166, "r_y3": 270.89, "coord_origin": "TOPLEFT"}, "text": "82.7", "orig": "82.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 181, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 326.795, "r_y0": 291.397, "r_x1": 377.863, "r_y1": 291.397, "r_x2": 377.863, "r_y2": 282.845, "r_x3": 326.795, "r_y3": 282.845, "coord_origin": "TOPLEFT"}, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 182, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 393.694, "r_y0": 291.397, "r_x1": 438.276, "r_y1": 291.397, "r_x2": 438.276, "r_y2": 282.845, "r_x3": 393.694, "r_y3": 282.845, "coord_origin": "TOPLEFT"}, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 183, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 455.631, "r_y0": 291.413, "r_x1": 473.066, "r_y1": 291.413, "r_x2": 473.066, "r_y2": 282.457, "r_x3": 455.631, "r_y3": 282.457, "coord_origin": "TOPLEFT"}, "text": "82.1", "orig": "82.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 184, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 498.171, "r_y0": 291.413, "r_x1": 515.606, "r_y1": 291.413, "r_x2": 515.606, "r_y2": 282.457, "r_x3": 498.171, "r_y3": 282.457, "coord_origin": "TOPLEFT"}, "text": "86.8", "orig": "86.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 185, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 326.795, "r_y0": 303.352, "r_x1": 377.863, "r_y1": 303.352, "r_x2": 377.863, "r_y2": 294.8, "r_x3": 326.795, "r_y3": 294.8, "coord_origin": "TOPLEFT"}, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 186, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 389.818, "r_y0": 303.352, "r_x1": 442.152, "r_y1": 303.352, "r_x2": 442.152, "r_y2": 294.8, "r_x3": 389.818, "r_y3": 294.8, "coord_origin": "TOPLEFT"}, "text": "SynthTabNet", "orig": "SynthTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 187, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 455.631, "r_y0": 303.352, "r_x1": 473.066, "r_y1": 303.352, "r_x2": 473.066, "r_y2": 294.8, "r_x3": 455.631, "r_y3": 294.8, "coord_origin": "TOPLEFT"}, "text": "87.7", "orig": "87.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 188, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 505.225, "r_y0": 303.352, "r_x1": 508.543, "r_y1": 303.352, "r_x2": 508.543, "r_y2": 294.8, "r_x3": 505.225, "r_y3": 294.8, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": [{"id": 83, "label": "text", "bbox": {"l": 339.323, "t": 253.933, "r": 365.335, "b": 262.485, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 173, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 339.323, "r_y0": 262.485, "r_x1": 365.335, "r_y1": 262.485, "r_x2": 365.335, "r_y2": 253.933, "r_x3": 339.323, "r_y3": 253.933, "coord_origin": "TOPLEFT"}, "text": "Model", "orig": "Model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 84, "label": "text", "bbox": {"l": 401.041, "t": 253.933, "r": 430.919, "b": 262.485, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 174, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 401.041, "r_y0": 262.485, "r_x1": 430.919, "r_y1": 262.485, "r_x2": 430.919, "r_y2": 253.933, "r_x3": 401.041, "r_y3": 253.933, "coord_origin": "TOPLEFT"}, "text": "Dataset", "orig": "Dataset", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 85, "label": "text", "bbox": {"l": 454.102, "t": 253.933, "r": 474.585, "b": 262.485, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 175, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 454.102, "r_y0": 262.485, "r_x1": 474.585, "r_y1": 262.485, "r_x2": 474.585, "r_y2": 253.933, "r_x3": 454.102, "r_y3": 253.933, "coord_origin": "TOPLEFT"}, "text": "mAP", "orig": "mAP", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 86, "label": "text", "bbox": {"l": 486.54, "t": 253.933, "r": 527.228, "b": 262.485, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 176, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 486.54, "r_y0": 262.485, "r_x1": 527.228, "r_y1": 262.485, "r_x2": 527.228, "r_y2": 253.933, "r_x3": 486.54, "r_y3": 253.933, "coord_origin": "TOPLEFT"}, "text": "mAP (PP)", "orig": "mAP (PP)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 87, "label": "text", "bbox": {"l": 327.656, "t": 270.89, "r": 377.001, "b": 279.442, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 177, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 327.656, "r_y0": 279.442, "r_x1": 377.001, "r_y1": 279.442, "r_x2": 377.001, "r_y2": 270.89, "r_x3": 327.656, "r_y3": 270.89, "coord_origin": "TOPLEFT"}, "text": "EDD+BBox", "orig": "EDD+BBox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 88, "label": "text", "bbox": {"l": 393.698, "t": 270.89, "r": 438.281, "b": 279.442, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 178, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 393.698, "r_y0": 279.442, "r_x1": 438.281, "r_y1": 279.442, "r_x2": 438.281, "r_y2": 270.89, "r_x3": 393.698, "r_y3": 270.89, "coord_origin": "TOPLEFT"}, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 89, "label": "text", "bbox": {"l": 455.636, "t": 270.89, "r": 473.07, "b": 279.442, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 179, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 455.636, "r_y0": 279.442, "r_x1": 473.07, "r_y1": 279.442, "r_x2": 473.07, "r_y2": 270.89, "r_x3": 455.636, "r_y3": 270.89, "coord_origin": "TOPLEFT"}, "text": "79.2", "orig": "79.2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 90, "label": "text", "bbox": {"l": 498.166, "t": 270.89, "r": 515.6, "b": 279.442, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 180, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 498.166, "r_y0": 279.442, "r_x1": 515.6, "r_y1": 279.442, "r_x2": 515.6, "r_y2": 270.89, "r_x3": 498.166, "r_y3": 270.89, "coord_origin": "TOPLEFT"}, "text": "82.7", "orig": "82.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 91, "label": "text", "bbox": {"l": 326.795, "t": 282.845, "r": 377.863, "b": 291.397, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 181, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 326.795, "r_y0": 291.397, "r_x1": 377.863, "r_y1": 291.397, "r_x2": 377.863, "r_y2": 282.845, "r_x3": 326.795, "r_y3": 282.845, "coord_origin": "TOPLEFT"}, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 92, "label": "text", "bbox": {"l": 393.694, "t": 282.845, "r": 438.276, "b": 291.397, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 182, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 393.694, "r_y0": 291.397, "r_x1": 438.276, "r_y1": 291.397, "r_x2": 438.276, "r_y2": 282.845, "r_x3": 393.694, "r_y3": 282.845, "coord_origin": "TOPLEFT"}, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 93, "label": "text", "bbox": {"l": 455.631, "t": 282.457, "r": 473.066, "b": 291.413, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 183, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 455.631, "r_y0": 291.413, "r_x1": 473.066, "r_y1": 291.413, "r_x2": 473.066, "r_y2": 282.457, "r_x3": 455.631, "r_y3": 282.457, "coord_origin": "TOPLEFT"}, "text": "82.1", "orig": "82.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 94, "label": "text", "bbox": {"l": 498.171, "t": 282.457, "r": 515.606, "b": 291.413, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 184, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 498.171, "r_y0": 291.413, "r_x1": 515.606, "r_y1": 291.413, "r_x2": 515.606, "r_y2": 282.457, "r_x3": 498.171, "r_y3": 282.457, "coord_origin": "TOPLEFT"}, "text": "86.8", "orig": "86.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 95, "label": "text", "bbox": {"l": 326.795, "t": 294.8, "r": 377.863, "b": 303.352, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 185, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 326.795, "r_y0": 303.352, "r_x1": 377.863, "r_y1": 303.352, "r_x2": 377.863, "r_y2": 294.8, "r_x3": 326.795, "r_y3": 294.8, "coord_origin": "TOPLEFT"}, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 96, "label": "text", "bbox": {"l": 389.818, "t": 294.8, "r": 442.152, "b": 303.352, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 186, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 389.818, "r_y0": 303.352, "r_x1": 442.152, "r_y1": 303.352, "r_x2": 442.152, "r_y2": 294.8, "r_x3": 389.818, "r_y3": 294.8, "coord_origin": "TOPLEFT"}, "text": "SynthTabNet", "orig": "SynthTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 97, "label": "text", "bbox": {"l": 455.631, "t": 294.8, "r": 473.066, "b": 303.352, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 187, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 455.631, "r_y0": 303.352, "r_x1": 473.066, "r_y1": 303.352, "r_x2": 473.066, "r_y2": 294.8, "r_x3": 455.631, "r_y3": 294.8, "coord_origin": "TOPLEFT"}, "text": "87.7", "orig": "87.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 98, "label": "text", "bbox": {"l": 505.225, "t": 294.8, "r": 508.543, "b": 303.352, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 188, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 505.225, "r_y0": 303.352, "r_x1": 508.543, "r_y1": 303.352, "r_x2": 508.543, "r_y2": 294.8, "r_x3": 505.225, "r_y3": 294.8, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}]}, "text": null, "otsl_seq": ["ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl"], "num_rows": 4, "num_cols": 4, "table_cells": [{"bbox": {"l": 339.323, "t": 253.933, "r": 365.335, "b": 262.485, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Model", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 401.041, "t": 253.933, "r": 430.919, "b": 262.485, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "Dataset", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 454.102, "t": 253.933, "r": 474.585, "b": 262.485, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "mAP", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 486.54, "t": 253.933, "r": 527.228, "b": 262.485, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "mAP (PP)", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 327.656, "t": 270.89, "r": 377.001, "b": 279.442, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "EDD+BBox", "column_header": false, "row_header": true, "row_section": false}, {"bbox": {"l": 393.698, "t": 270.89, "r": 438.281, "b": 279.442, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "PubTabNet", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 455.636, "t": 270.89, "r": 473.07, "b": 279.442, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "79.2", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 498.166, "t": 270.89, "r": 515.6, "b": 279.442, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "82.7", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 326.795, "t": 282.845, "r": 377.863, "b": 291.397, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "TableFormer", "column_header": false, "row_header": true, "row_section": false}, {"bbox": {"l": 393.694, "t": 282.845, "r": 438.276, "b": 291.397, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "PubTabNet", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 455.631, "t": 282.457, "r": 473.066, "b": 291.413, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "82.1", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 498.171, "t": 282.457, "r": 515.606, "b": 291.413, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "86.8", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 326.795, "t": 294.8, "r": 377.863, "b": 303.352, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "TableFormer", "column_header": false, "row_header": true, "row_section": false}, {"bbox": {"l": 389.818, "t": 294.8, "r": 442.152, "b": 303.352, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "SynthTabNet", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 455.631, "t": 294.8, "r": 473.066, "b": 303.352, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "87.7", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 505.225, "t": 294.8, "r": 508.543, "b": 303.352, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "-", "column_header": false, "row_header": false, "row_section": false}]}, "5": {"label": "table", "id": 5, "page_no": 6, "cluster": {"id": 5, "label": "table", "bbox": {"l": 332.9688720703125, "t": 540.2835693359375, "r": 520.942138671875, "b": 643.2697143554688, "coord_origin": "TOPLEFT"}, "confidence": 0.9775567650794983, "cells": [{"index": 215, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 358.011, "r_y0": 561.054, "r_x1": 384.023, "r_y1": 561.054, "r_x2": 384.023, "r_y2": 552.502, "r_x3": 358.011, "r_y3": 552.502, "coord_origin": "TOPLEFT"}, "text": "Model", "orig": "Model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 216, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 449.034, "r_y0": 555.076, "r_x1": 473.94, "r_y1": 555.076, "r_x2": 473.94, "r_y2": 546.524, "r_x3": 449.034, "r_y3": 546.524, "coord_origin": "TOPLEFT"}, "text": "TEDS", "orig": "TEDS", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 217, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 408.506, "r_y0": 567.031, "r_x1": 436.74, "r_y1": 567.031, "r_x2": 436.74, "r_y2": 558.479, "r_x3": 408.506, "r_y3": 558.479, "coord_origin": "TOPLEFT"}, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 218, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 448.695, "r_y0": 567.031, "r_x1": 485.079, "r_y1": 567.031, "r_x2": 485.079, "r_y2": 558.479, "r_x3": 448.695, "r_y3": 558.479, "coord_origin": "TOPLEFT"}, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 219, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 499.385, "r_y0": 567.031, "r_x1": 512.117, "r_y1": 567.031, "r_x2": 512.117, "r_y2": 558.479, "r_x3": 499.385, "r_y3": 558.479, "coord_origin": "TOPLEFT"}, "text": "All", "orig": "All", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 220, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 357.682, "r_y0": 583.988, "r_x1": 384.352, "r_y1": 583.988, "r_x2": 384.352, "r_y2": 575.436, "r_x3": 357.682, "r_y3": 575.436, "coord_origin": "TOPLEFT"}, "text": "Tabula", "orig": "Tabula", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 221, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 413.901, "r_y0": 583.988, "r_x1": 431.336, "r_y1": 583.988, "r_x2": 431.336, "r_y2": 575.436, "r_x3": 413.901, "r_y3": 575.436, "coord_origin": "TOPLEFT"}, "text": "78.0", "orig": "78.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 222, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 458.165, "r_y0": 583.988, "r_x1": 475.599, "r_y1": 583.988, "r_x2": 475.599, "r_y2": 575.436, "r_x3": 458.165, "r_y3": 575.436, "coord_origin": "TOPLEFT"}, "text": "57.8", "orig": "57.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 223, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 497.029, "r_y0": 583.988, "r_x1": 514.463, "r_y1": 583.988, "r_x2": 514.463, "r_y2": 575.436, "r_x3": 497.029, "r_y3": 575.436, "coord_origin": "TOPLEFT"}, "text": "67.9", "orig": "67.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 224, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 350.723, "r_y0": 595.943, "r_x1": 391.311, "r_y1": 595.943, "r_x2": 391.311, "r_y2": 587.391, "r_x3": 350.723, "r_y3": 587.391, "coord_origin": "TOPLEFT"}, "text": "Traprange", "orig": "Traprange", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 225, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 413.906, "r_y0": 595.943, "r_x1": 431.34, "r_y1": 595.943, "r_x2": 431.34, "r_y2": 587.391, "r_x3": 413.906, "r_y3": 587.391, "coord_origin": "TOPLEFT"}, "text": "60.8", "orig": "60.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 226, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 458.17, "r_y0": 595.943, "r_x1": 475.604, "r_y1": 595.943, "r_x2": 475.604, "r_y2": 587.391, "r_x3": 458.17, "r_y3": 587.391, "coord_origin": "TOPLEFT"}, "text": "49.9", "orig": "49.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 227, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 497.034, "r_y0": 595.943, "r_x1": 514.468, "r_y1": 595.943, "r_x2": 514.468, "r_y2": 587.391, "r_x3": 497.034, "r_y3": 587.391, "coord_origin": "TOPLEFT"}, "text": "55.4", "orig": "55.4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 228, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 354.136, "r_y0": 607.899, "r_x1": 387.899, "r_y1": 607.899, "r_x2": 387.899, "r_y2": 599.347, "r_x3": 354.136, "r_y3": 599.347, "coord_origin": "TOPLEFT"}, "text": "Camelot", "orig": "Camelot", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 229, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 413.902, "r_y0": 607.899, "r_x1": 431.336, "r_y1": 607.899, "r_x2": 431.336, "r_y2": 599.347, "r_x3": 413.902, "r_y3": 599.347, "coord_origin": "TOPLEFT"}, "text": "80.0", "orig": "80.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 230, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 458.165, "r_y0": 607.899, "r_x1": 475.6, "r_y1": 607.899, "r_x2": 475.6, "r_y2": 599.347, "r_x3": 458.165, "r_y3": 599.347, "coord_origin": "TOPLEFT"}, "text": "66.0", "orig": "66.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 231, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 497.03, "r_y0": 607.899, "r_x1": 514.464, "r_y1": 607.899, "r_x2": 514.464, "r_y2": 599.347, "r_x3": 497.03, "r_y3": 599.347, "coord_origin": "TOPLEFT"}, "text": "73.0", "orig": "73.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 232, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 346.559, "r_y0": 619.854, "r_x1": 395.475, "r_y1": 619.854, "r_x2": 395.475, "r_y2": 611.302, "r_x3": 346.559, "r_y3": 611.302, "coord_origin": "TOPLEFT"}, "text": "Acrobat Pro", "orig": "Acrobat Pro", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 233, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 413.906, "r_y0": 619.854, "r_x1": 431.341, "r_y1": 619.854, "r_x2": 431.341, "r_y2": 611.302, "r_x3": 413.906, "r_y3": 611.302, "coord_origin": "TOPLEFT"}, "text": "68.9", "orig": "68.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 234, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 458.17, "r_y0": 619.854, "r_x1": 475.605, "r_y1": 619.854, "r_x2": 475.605, "r_y2": 611.302, "r_x3": 458.17, "r_y3": 611.302, "coord_origin": "TOPLEFT"}, "text": "61.8", "orig": "61.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 235, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 497.034, "r_y0": 619.854, "r_x1": 514.469, "r_y1": 619.854, "r_x2": 514.469, "r_y2": 611.302, "r_x3": 497.034, "r_y3": 611.302, "coord_origin": "TOPLEFT"}, "text": "65.3", "orig": "65.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 236, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 360.781, "r_y0": 631.809, "r_x1": 381.254, "r_y1": 631.809, "r_x2": 381.254, "r_y2": 623.2570000000001, "r_x3": 360.781, "r_y3": 623.2570000000001, "coord_origin": "TOPLEFT"}, "text": "EDD", "orig": "EDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 237, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 413.902, "r_y0": 631.809, "r_x1": 431.336, "r_y1": 631.809, "r_x2": 431.336, "r_y2": 623.2570000000001, "r_x3": 413.902, "r_y3": 623.2570000000001, "coord_origin": "TOPLEFT"}, "text": "91.2", "orig": "91.2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 238, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 458.165, "r_y0": 631.809, "r_x1": 475.6, "r_y1": 631.809, "r_x2": 475.6, "r_y2": 623.2570000000001, "r_x3": 458.165, "r_y3": 623.2570000000001, "coord_origin": "TOPLEFT"}, "text": "85.4", "orig": "85.4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 239, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 497.03, "r_y0": 631.809, "r_x1": 514.464, "r_y1": 631.809, "r_x2": 514.464, "r_y2": 623.2570000000001, "r_x3": 497.03, "r_y3": 623.2570000000001, "coord_origin": "TOPLEFT"}, "text": "88.3", "orig": "88.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 240, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 345.483, "r_y0": 643.764, "r_x1": 396.551, "r_y1": 643.764, "r_x2": 396.551, "r_y2": 635.212, "r_x3": 345.483, "r_y3": 635.212, "coord_origin": "TOPLEFT"}, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 241, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 413.906, "r_y0": 643.764, "r_x1": 431.341, "r_y1": 643.764, "r_x2": 431.341, "r_y2": 635.212, "r_x3": 413.906, "r_y3": 635.212, "coord_origin": "TOPLEFT"}, "text": "95.4", "orig": "95.4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 242, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 458.17, "r_y0": 643.764, "r_x1": 475.605, "r_y1": 643.764, "r_x2": 475.605, "r_y2": 635.212, "r_x3": 458.17, "r_y3": 635.212, "coord_origin": "TOPLEFT"}, "text": "90.1", "orig": "90.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 243, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 497.034, "r_y0": 643.78, "r_x1": 514.469, "r_y1": 643.78, "r_x2": 514.469, "r_y2": 634.8240000000001, "r_x3": 497.034, "r_y3": 634.8240000000001, "coord_origin": "TOPLEFT"}, "text": "93.6", "orig": "93.6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": [{"id": 99, "label": "text", "bbox": {"l": 358.011, "t": 552.502, "r": 384.023, "b": 561.054, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 215, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 358.011, "r_y0": 561.054, "r_x1": 384.023, "r_y1": 561.054, "r_x2": 384.023, "r_y2": 552.502, "r_x3": 358.011, "r_y3": 552.502, "coord_origin": "TOPLEFT"}, "text": "Model", "orig": "Model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 100, "label": "text", "bbox": {"l": 449.034, "t": 546.524, "r": 473.94, "b": 555.076, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 216, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 449.034, "r_y0": 555.076, "r_x1": 473.94, "r_y1": 555.076, "r_x2": 473.94, "r_y2": 546.524, "r_x3": 449.034, "r_y3": 546.524, "coord_origin": "TOPLEFT"}, "text": "TEDS", "orig": "TEDS", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 101, "label": "text", "bbox": {"l": 408.506, "t": 558.479, "r": 436.74, "b": 567.031, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 217, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 408.506, "r_y0": 567.031, "r_x1": 436.74, "r_y1": 567.031, "r_x2": 436.74, "r_y2": 558.479, "r_x3": 408.506, "r_y3": 558.479, "coord_origin": "TOPLEFT"}, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 102, "label": "text", "bbox": {"l": 448.695, "t": 558.479, "r": 485.079, "b": 567.031, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 218, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 448.695, "r_y0": 567.031, "r_x1": 485.079, "r_y1": 567.031, "r_x2": 485.079, "r_y2": 558.479, "r_x3": 448.695, "r_y3": 558.479, "coord_origin": "TOPLEFT"}, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 103, "label": "text", "bbox": {"l": 499.385, "t": 558.479, "r": 512.117, "b": 567.031, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 219, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 499.385, "r_y0": 567.031, "r_x1": 512.117, "r_y1": 567.031, "r_x2": 512.117, "r_y2": 558.479, "r_x3": 499.385, "r_y3": 558.479, "coord_origin": "TOPLEFT"}, "text": "All", "orig": "All", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 104, "label": "text", "bbox": {"l": 357.682, "t": 575.436, "r": 384.352, "b": 583.988, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 220, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 357.682, "r_y0": 583.988, "r_x1": 384.352, "r_y1": 583.988, "r_x2": 384.352, "r_y2": 575.436, "r_x3": 357.682, "r_y3": 575.436, "coord_origin": "TOPLEFT"}, "text": "Tabula", "orig": "Tabula", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 105, "label": "text", "bbox": {"l": 413.901, "t": 575.436, "r": 431.336, "b": 583.988, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 221, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 413.901, "r_y0": 583.988, "r_x1": 431.336, "r_y1": 583.988, "r_x2": 431.336, "r_y2": 575.436, "r_x3": 413.901, "r_y3": 575.436, "coord_origin": "TOPLEFT"}, "text": "78.0", "orig": "78.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 106, "label": "text", "bbox": {"l": 458.165, "t": 575.436, "r": 475.599, "b": 583.988, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 222, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 458.165, "r_y0": 583.988, "r_x1": 475.599, "r_y1": 583.988, "r_x2": 475.599, "r_y2": 575.436, "r_x3": 458.165, "r_y3": 575.436, "coord_origin": "TOPLEFT"}, "text": "57.8", "orig": "57.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 107, "label": "text", "bbox": {"l": 497.029, "t": 575.436, "r": 514.463, "b": 583.988, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 223, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 497.029, "r_y0": 583.988, "r_x1": 514.463, "r_y1": 583.988, "r_x2": 514.463, "r_y2": 575.436, "r_x3": 497.029, "r_y3": 575.436, "coord_origin": "TOPLEFT"}, "text": "67.9", "orig": "67.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 108, "label": "text", "bbox": {"l": 350.723, "t": 587.391, "r": 391.311, "b": 595.943, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 224, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 350.723, "r_y0": 595.943, "r_x1": 391.311, "r_y1": 595.943, "r_x2": 391.311, "r_y2": 587.391, "r_x3": 350.723, "r_y3": 587.391, "coord_origin": "TOPLEFT"}, "text": "Traprange", "orig": "Traprange", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 109, "label": "text", "bbox": {"l": 413.906, "t": 587.391, "r": 431.34, "b": 595.943, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 225, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 413.906, "r_y0": 595.943, "r_x1": 431.34, "r_y1": 595.943, "r_x2": 431.34, "r_y2": 587.391, "r_x3": 413.906, "r_y3": 587.391, "coord_origin": "TOPLEFT"}, "text": "60.8", "orig": "60.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 110, "label": "text", "bbox": {"l": 458.17, "t": 587.391, "r": 475.604, "b": 595.943, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 226, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 458.17, "r_y0": 595.943, "r_x1": 475.604, "r_y1": 595.943, "r_x2": 475.604, "r_y2": 587.391, "r_x3": 458.17, "r_y3": 587.391, "coord_origin": "TOPLEFT"}, "text": "49.9", "orig": "49.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 111, "label": "text", "bbox": {"l": 497.034, "t": 587.391, "r": 514.468, "b": 595.943, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 227, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 497.034, "r_y0": 595.943, "r_x1": 514.468, "r_y1": 595.943, "r_x2": 514.468, "r_y2": 587.391, "r_x3": 497.034, "r_y3": 587.391, "coord_origin": "TOPLEFT"}, "text": "55.4", "orig": "55.4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 112, "label": "text", "bbox": {"l": 354.136, "t": 599.347, "r": 387.899, "b": 607.899, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 228, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 354.136, "r_y0": 607.899, "r_x1": 387.899, "r_y1": 607.899, "r_x2": 387.899, "r_y2": 599.347, "r_x3": 354.136, "r_y3": 599.347, "coord_origin": "TOPLEFT"}, "text": "Camelot", "orig": "Camelot", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 113, "label": "text", "bbox": {"l": 413.902, "t": 599.347, "r": 431.336, "b": 607.899, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 229, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 413.902, "r_y0": 607.899, "r_x1": 431.336, "r_y1": 607.899, "r_x2": 431.336, "r_y2": 599.347, "r_x3": 413.902, "r_y3": 599.347, "coord_origin": "TOPLEFT"}, "text": "80.0", "orig": "80.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 114, "label": "text", "bbox": {"l": 458.165, "t": 599.347, "r": 475.6, "b": 607.899, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 230, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 458.165, "r_y0": 607.899, "r_x1": 475.6, "r_y1": 607.899, "r_x2": 475.6, "r_y2": 599.347, "r_x3": 458.165, "r_y3": 599.347, "coord_origin": "TOPLEFT"}, "text": "66.0", "orig": "66.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 115, "label": "text", "bbox": {"l": 497.03, "t": 599.347, "r": 514.464, "b": 607.899, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 231, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 497.03, "r_y0": 607.899, "r_x1": 514.464, "r_y1": 607.899, "r_x2": 514.464, "r_y2": 599.347, "r_x3": 497.03, "r_y3": 599.347, "coord_origin": "TOPLEFT"}, "text": "73.0", "orig": "73.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 116, "label": "text", "bbox": {"l": 346.559, "t": 611.302, "r": 395.475, "b": 619.854, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 232, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 346.559, "r_y0": 619.854, "r_x1": 395.475, "r_y1": 619.854, "r_x2": 395.475, "r_y2": 611.302, "r_x3": 346.559, "r_y3": 611.302, "coord_origin": "TOPLEFT"}, "text": "Acrobat Pro", "orig": "Acrobat Pro", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 117, "label": "text", "bbox": {"l": 413.906, "t": 611.302, "r": 431.341, "b": 619.854, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 233, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 413.906, "r_y0": 619.854, "r_x1": 431.341, "r_y1": 619.854, "r_x2": 431.341, "r_y2": 611.302, "r_x3": 413.906, "r_y3": 611.302, "coord_origin": "TOPLEFT"}, "text": "68.9", "orig": "68.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 118, "label": "text", "bbox": {"l": 458.17, "t": 611.302, "r": 475.605, "b": 619.854, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 234, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 458.17, "r_y0": 619.854, "r_x1": 475.605, "r_y1": 619.854, "r_x2": 475.605, "r_y2": 611.302, "r_x3": 458.17, "r_y3": 611.302, "coord_origin": "TOPLEFT"}, "text": "61.8", "orig": "61.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 119, "label": "text", "bbox": {"l": 497.034, "t": 611.302, "r": 514.469, "b": 619.854, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 235, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 497.034, "r_y0": 619.854, "r_x1": 514.469, "r_y1": 619.854, "r_x2": 514.469, "r_y2": 611.302, "r_x3": 497.034, "r_y3": 611.302, "coord_origin": "TOPLEFT"}, "text": "65.3", "orig": "65.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 120, "label": "text", "bbox": {"l": 360.781, "t": 623.2570000000001, "r": 381.254, "b": 631.809, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 236, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 360.781, "r_y0": 631.809, "r_x1": 381.254, "r_y1": 631.809, "r_x2": 381.254, "r_y2": 623.2570000000001, "r_x3": 360.781, "r_y3": 623.2570000000001, "coord_origin": "TOPLEFT"}, "text": "EDD", "orig": "EDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 121, "label": "text", "bbox": {"l": 413.902, "t": 623.2570000000001, "r": 431.336, "b": 631.809, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 237, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 413.902, "r_y0": 631.809, "r_x1": 431.336, "r_y1": 631.809, "r_x2": 431.336, "r_y2": 623.2570000000001, "r_x3": 413.902, "r_y3": 623.2570000000001, "coord_origin": "TOPLEFT"}, "text": "91.2", "orig": "91.2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 122, "label": "text", "bbox": {"l": 458.165, "t": 623.2570000000001, "r": 475.6, "b": 631.809, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 238, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 458.165, "r_y0": 631.809, "r_x1": 475.6, "r_y1": 631.809, "r_x2": 475.6, "r_y2": 623.2570000000001, "r_x3": 458.165, "r_y3": 623.2570000000001, "coord_origin": "TOPLEFT"}, "text": "85.4", "orig": "85.4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 123, "label": "text", "bbox": {"l": 497.03, "t": 623.2570000000001, "r": 514.464, "b": 631.809, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 239, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 497.03, "r_y0": 631.809, "r_x1": 514.464, "r_y1": 631.809, "r_x2": 514.464, "r_y2": 623.2570000000001, "r_x3": 497.03, "r_y3": 623.2570000000001, "coord_origin": "TOPLEFT"}, "text": "88.3", "orig": "88.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 124, "label": "text", "bbox": {"l": 345.483, "t": 635.212, "r": 396.551, "b": 643.764, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 240, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 345.483, "r_y0": 643.764, "r_x1": 396.551, "r_y1": 643.764, "r_x2": 396.551, "r_y2": 635.212, "r_x3": 345.483, "r_y3": 635.212, "coord_origin": "TOPLEFT"}, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 125, "label": "text", "bbox": {"l": 413.906, "t": 635.212, "r": 431.341, "b": 643.764, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 241, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 413.906, "r_y0": 643.764, "r_x1": 431.341, "r_y1": 643.764, "r_x2": 431.341, "r_y2": 635.212, "r_x3": 413.906, "r_y3": 635.212, "coord_origin": "TOPLEFT"}, "text": "95.4", "orig": "95.4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 126, "label": "text", "bbox": {"l": 458.17, "t": 635.212, "r": 475.605, "b": 643.764, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 242, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 458.17, "r_y0": 643.764, "r_x1": 475.605, "r_y1": 643.764, "r_x2": 475.605, "r_y2": 635.212, "r_x3": 458.17, "r_y3": 635.212, "coord_origin": "TOPLEFT"}, "text": "90.1", "orig": "90.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 127, "label": "text", "bbox": {"l": 497.034, "t": 634.8240000000001, "r": 514.469, "b": 643.78, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 243, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 497.034, "r_y0": 643.78, "r_x1": 514.469, "r_y1": 643.78, "r_x2": 514.469, "r_y2": 634.8240000000001, "r_x3": 497.034, "r_y3": 634.8240000000001, "coord_origin": "TOPLEFT"}, "text": "93.6", "orig": "93.6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}]}, "text": null, "otsl_seq": ["fcel", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl"], "num_rows": 7, "num_cols": 4, "table_cells": [{"bbox": {"l": 358.011, "t": 552.502, "r": 384.023, "b": 561.054, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Model", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 448.695, "t": 546.524, "r": 485.079, "b": 567.031, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "TEDS Complex", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 408.506, "t": 558.479, "r": 436.74, "b": 567.031, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "Simple", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 499.385, "t": 558.479, "r": 512.117, "b": 567.031, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "All", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 357.682, "t": 575.436, "r": 384.352, "b": 583.988, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Tabula", "column_header": false, "row_header": true, "row_section": false}, {"bbox": {"l": 413.901, "t": 575.436, "r": 431.336, "b": 583.988, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "78.0", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 458.165, "t": 575.436, "r": 475.599, "b": 583.988, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "57.8", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 497.029, "t": 575.436, "r": 514.463, "b": 583.988, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "67.9", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 350.723, "t": 587.391, "r": 391.311, "b": 595.943, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Traprange", "column_header": false, "row_header": true, "row_section": false}, {"bbox": {"l": 413.906, "t": 587.391, "r": 431.34, "b": 595.943, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "60.8", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 458.17, "t": 587.391, "r": 475.604, "b": 595.943, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "49.9", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 497.034, "t": 587.391, "r": 514.468, "b": 595.943, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "55.4", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 354.136, "t": 599.347, "r": 387.899, "b": 607.899, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Camelot", "column_header": false, "row_header": true, "row_section": false}, {"bbox": {"l": 413.902, "t": 599.347, "r": 431.336, "b": 607.899, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "80.0", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 458.165, "t": 599.347, "r": 475.6, "b": 607.899, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "66.0", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 497.03, "t": 599.347, "r": 514.464, "b": 607.899, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "73.0", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 346.559, "t": 611.302, "r": 395.475, "b": 619.854, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Acrobat Pro", "column_header": false, "row_header": true, "row_section": false}, {"bbox": {"l": 413.906, "t": 611.302, "r": 431.341, "b": 619.854, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "68.9", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 458.17, "t": 611.302, "r": 475.605, "b": 619.854, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "61.8", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 497.034, "t": 611.302, "r": 514.469, "b": 619.854, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "65.3", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 360.781, "t": 623.2570000000001, "r": 381.254, "b": 631.809, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "EDD", "column_header": false, "row_header": true, "row_section": false}, {"bbox": {"l": 413.902, "t": 623.2570000000001, "r": 431.336, "b": 631.809, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "91.2", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 458.165, "t": 623.2570000000001, "r": 475.6, "b": 631.809, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "85.4", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 497.03, "t": 623.2570000000001, "r": 514.464, "b": 631.809, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "88.3", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 345.483, "t": 635.212, "r": 396.551, "b": 643.764, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "TableFormer", "column_header": false, "row_header": true, "row_section": false}, {"bbox": {"l": 413.906, "t": 635.212, "r": 431.341, "b": 643.764, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "95.4", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 458.17, "t": 635.212, "r": 475.605, "b": 643.764, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "90.1", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 497.034, "t": 634.8240000000001, "r": 514.469, "b": 643.78, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "93.6", "column_header": false, "row_header": false, "row_section": false}]}}}, "figures_classification": null, "equations_prediction": null, "vlm_response": null}, "assembled": {"elements": [{"label": "section_header", "id": 10, "page_no": 6, "cluster": {"id": 10, "label": "section_header", "bbox": {"l": 50.112, "t": 74.40099999999995, "r": 167.898, "b": 84.25300000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.9554274082183838, "cells": [{"index": 0, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 84.25300000000004, "r_x1": 167.898, "r_y1": 84.25300000000004, "r_x2": 167.898, "r_y2": 74.40099999999995, "r_x3": 50.112, "r_y3": 74.40099999999995, "coord_origin": "TOPLEFT"}, "text": "5.3. Datasets and Metrics", "orig": "5.3. Datasets and Metrics", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "5.3. Datasets and Metrics"}, {"label": "text", "id": 1, "page_no": 6, "cluster": {"id": 1, "label": "text", "bbox": {"l": 50.112, "t": 93.61900000000003, "r": 286.365, "b": 138.03700000000003, "coord_origin": "TOPLEFT"}, "confidence": 0.9862998127937317, "cells": [{"index": 1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 102.17100000000005, "r_x1": 286.365, "r_y1": 102.17100000000005, "r_x2": 286.365, "r_y2": 93.61900000000003, "r_x3": 62.067, "r_y3": 93.61900000000003, "coord_origin": "TOPLEFT"}, "text": "The Tree-Edit-Distance-Based Similarity (TEDS) met-", "orig": "The Tree-Edit-Distance-Based Similarity (TEDS) met-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 114.12599999999998, "r_x1": 286.365, "r_y1": 114.12599999999998, "r_x2": 286.365, "r_y2": 105.57399999999996, "r_x3": 50.112, "r_y3": 105.57399999999996, "coord_origin": "TOPLEFT"}, "text": "ric was introduced in [37]. It represents the prediction, and", "orig": "ric was introduced in [37]. It represents the prediction, and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 126.08100000000002, "r_x1": 239.999, "r_y1": 126.08100000000002, "r_x2": 239.999, "r_y2": 117.529, "r_x3": 50.112, "r_y3": 117.529, "coord_origin": "TOPLEFT"}, "text": "ground-truth as a tree structure of HTML tags.", "orig": "ground-truth as a tree structure of HTML tags.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 245.03, "r_y0": 126.08100000000002, "r_x1": 286.365, "r_y1": 126.08100000000002, "r_x2": 286.365, "r_y2": 117.529, "r_x3": 245.03, "r_y3": 117.529, "coord_origin": "TOPLEFT"}, "text": "This simi-", "orig": "This simi-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 138.03700000000003, "r_x1": 136.717, "r_y1": 138.03700000000003, "r_x2": 136.717, "r_y2": 129.485, "r_x3": 50.112, "r_y3": 129.485, "coord_origin": "TOPLEFT"}, "text": "larity is calculated as:", "orig": "larity is calculated as:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "The Tree-Edit-Distance-Based Similarity (TEDS) metric was introduced in [37]. It represents the prediction, and ground-truth as a tree structure of HTML tags. This similarity is calculated as:"}, {"label": "formula", "id": 13, "page_no": 6, "cluster": {"id": 13, "label": "formula", "bbox": {"l": 86.219, "t": 150.428, "r": 286.362, "b": 173.63199999999995, "coord_origin": "TOPLEFT"}, "confidence": 0.9500409364700317, "cells": [{"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 86.219, "r_y0": 165.87400000000002, "r_x1": 118.878, "r_y1": 165.87400000000002, "r_x2": 118.878, "r_y2": 157.168, "r_x3": 86.219, "r_y3": 157.168, "coord_origin": "TOPLEFT"}, "text": "TEDS(", "orig": "TEDS(", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 118.875, "r_y0": 165.87400000000002, "r_x1": 139.77, "r_y1": 165.87400000000002, "r_x2": 139.77, "r_y2": 157.168, "r_x3": 118.875, "r_y3": 157.168, "coord_origin": "TOPLEFT"}, "text": "T , T", "orig": "T , T", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 124.697, "r_y0": 166.798, "r_x1": 129.019, "r_y1": 166.798, "r_x2": 129.019, "r_y2": 160.70399999999995, "r_x3": 124.697, "r_y3": 160.70399999999995, "coord_origin": "TOPLEFT"}, "text": "a", "orig": "a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 139.766, "r_y0": 166.798, "r_x1": 143.27, "r_y1": 166.798, "r_x2": 143.27, "r_y2": 160.70399999999995, "r_x3": 139.766, "r_y3": 160.70399999999995, "coord_origin": "TOPLEFT"}, "text": "b", "orig": "b", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 143.768, "r_y0": 165.87400000000002, "r_x1": 165.902, "r_y1": 165.87400000000002, "r_x2": 165.902, "r_y2": 157.168, "r_x3": 143.768, "r_y3": 157.168, "coord_origin": "TOPLEFT"}, "text": ") = 1", "orig": ") = 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 168.121, "r_y0": 165.73199999999997, "r_x1": 175.87, "r_y1": 165.73199999999997, "r_x2": 175.87, "r_y2": 157.168, "r_x3": 168.121, "r_y3": 157.168, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 179.279, "r_y0": 159.13400000000001, "r_x1": 221.957, "r_y1": 159.13400000000001, "r_x2": 221.957, "r_y2": 150.428, "r_x3": 179.279, "r_y3": 150.428, "coord_origin": "TOPLEFT"}, "text": "EditDist (", "orig": "EditDist (", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 221.952, "r_y0": 159.13400000000001, "r_x1": 242.848, "r_y1": 159.13400000000001, "r_x2": 242.848, "r_y2": 150.428, "r_x3": 221.952, "r_y3": 150.428, "coord_origin": "TOPLEFT"}, "text": "T , T", "orig": "T , T", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 227.774, "r_y0": 160.058, "r_x1": 232.096, "r_y1": 160.058, "r_x2": 232.096, "r_y2": 153.96400000000006, "r_x3": 227.774, "r_y3": 153.96400000000006, "coord_origin": "TOPLEFT"}, "text": "a", "orig": "a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 242.843, "r_y0": 160.058, "r_x1": 246.347, "r_y1": 160.058, "r_x2": 246.347, "r_y2": 153.96400000000006, "r_x3": 242.843, "r_y3": 153.96400000000006, "coord_origin": "TOPLEFT"}, "text": "b", "orig": "b", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 246.845, "r_y0": 159.13400000000001, "r_x1": 250.719, "r_y1": 159.13400000000001, "r_x2": 250.719, "r_y2": 150.428, "r_x3": 246.845, "r_y3": 150.428, "coord_origin": "TOPLEFT"}, "text": ")", "orig": ")", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 182.212, "r_y0": 172.70799999999997, "r_x1": 206.292, "r_y1": 172.70799999999997, "r_x2": 206.292, "r_y2": 164.00199999999995, "r_x3": 182.212, "r_y3": 164.00199999999995, "coord_origin": "TOPLEFT"}, "text": "max(", "orig": "max(", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 206.289, "r_y0": 172.56600000000003, "r_x1": 209.057, "r_y1": 172.56600000000003, "r_x2": 209.057, "r_y2": 164.00199999999995, "r_x3": 206.289, "r_y3": 164.00199999999995, "coord_origin": "TOPLEFT"}, "text": "|", "orig": "|", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 19, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 209.056, "r_y0": 172.70799999999997, "r_x1": 214.878, "r_y1": 172.70799999999997, "r_x2": 214.878, "r_y2": 164.00199999999995, "r_x3": 209.056, "r_y3": 164.00199999999995, "coord_origin": "TOPLEFT"}, "text": "T", "orig": "T", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 20, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 214.878, "r_y0": 173.63199999999995, "r_x1": 219.2, "r_y1": 173.63199999999995, "r_x2": 219.2, "r_y2": 167.538, "r_x3": 214.878, "r_y3": 167.538, "coord_origin": "TOPLEFT"}, "text": "a", "orig": "a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 21, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 219.697, "r_y0": 172.56600000000003, "r_x1": 222.465, "r_y1": 172.56600000000003, "r_x2": 222.465, "r_y2": 164.00199999999995, "r_x3": 219.697, "r_y3": 164.00199999999995, "coord_origin": "TOPLEFT"}, "text": "|", "orig": "|", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 22, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 224.125, "r_y0": 172.70799999999997, "r_x1": 226.893, "r_y1": 172.70799999999997, "r_x2": 226.893, "r_y2": 164.00199999999995, "r_x3": 224.125, "r_y3": 164.00199999999995, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 23, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 228.553, "r_y0": 172.56600000000003, "r_x1": 231.321, "r_y1": 172.56600000000003, "r_x2": 231.321, "r_y2": 164.00199999999995, "r_x3": 228.553, "r_y3": 164.00199999999995, "coord_origin": "TOPLEFT"}, "text": "|", "orig": "|", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 24, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 231.32, "r_y0": 172.70799999999997, "r_x1": 237.142, "r_y1": 172.70799999999997, "r_x2": 237.142, "r_y2": 164.00199999999995, "r_x3": 231.32, "r_y3": 164.00199999999995, "coord_origin": "TOPLEFT"}, "text": "T", "orig": "T", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 25, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 237.142, "r_y0": 173.63199999999995, "r_x1": 240.646, "r_y1": 173.63199999999995, "r_x2": 240.646, "r_y2": 167.538, "r_x3": 237.142, "r_y3": 167.538, "coord_origin": "TOPLEFT"}, "text": "b", "orig": "b", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 26, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 241.144, "r_y0": 172.56600000000003, "r_x1": 243.912, "r_y1": 172.56600000000003, "r_x2": 243.912, "r_y2": 164.00199999999995, "r_x3": 241.144, "r_y3": 164.00199999999995, "coord_origin": "TOPLEFT"}, "text": "|", "orig": "|", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 27, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 243.911, "r_y0": 172.70799999999997, "r_x1": 247.785, "r_y1": 172.70799999999997, "r_x2": 247.785, "r_y2": 164.00199999999995, "r_x3": 243.911, "r_y3": 164.00199999999995, "coord_origin": "TOPLEFT"}, "text": ")", "orig": ")", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 28, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 274.746, "r_y0": 166.038, "r_x1": 286.362, "r_y1": 166.038, "r_x2": 286.362, "r_y2": 157.486, "r_x3": 274.746, "r_y3": 157.486, "coord_origin": "TOPLEFT"}, "text": "(3)", "orig": "(3)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "TEDS( T , T a b ) = 1 -EditDist ( T , T a b ) max( | T a | , | T b | ) (3)"}, {"label": "text", "id": 6, "page_no": 6, "cluster": {"id": 6, "label": "text", "bbox": {"l": 50.112, "t": 181.11300000000006, "r": 286.363, "b": 213.89300000000003, "coord_origin": "TOPLEFT"}, "confidence": 0.9735319018363953, "cells": [{"index": 29, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 189.98299999999995, "r_x1": 86.406, "r_y1": 189.98299999999995, "r_x2": 86.406, "r_y2": 181.43100000000004, "r_x3": 62.067, "r_y3": 181.43100000000004, "coord_origin": "TOPLEFT"}, "text": "where", "orig": "where", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 30, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 88.581, "r_y0": 189.81899999999996, "r_x1": 94.403, "r_y1": 189.81899999999996, "r_x2": 94.403, "r_y2": 181.11300000000006, "r_x3": 88.581, "r_y3": 181.11300000000006, "coord_origin": "TOPLEFT"}, "text": "T", "orig": "T", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 94.403, "r_y0": 190.74199999999996, "r_x1": 98.725, "r_y1": 190.74199999999996, "r_x2": 98.725, "r_y2": 184.64800000000002, "r_x3": 94.403, "r_y3": 184.64800000000002, "coord_origin": "TOPLEFT"}, "text": "a", "orig": "a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 101.399, "r_y0": 189.98299999999995, "r_x1": 115.785, "r_y1": 189.98299999999995, "r_x2": 115.785, "r_y2": 181.43100000000004, "r_x3": 101.399, "r_y3": 181.43100000000004, "coord_origin": "TOPLEFT"}, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 117.961, "r_y0": 189.81899999999996, "r_x1": 123.783, "r_y1": 189.81899999999996, "r_x2": 123.783, "r_y2": 181.11300000000006, "r_x3": 117.961, "r_y3": 181.11300000000006, "coord_origin": "TOPLEFT"}, "text": "T", "orig": "T", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 123.783, "r_y0": 190.74199999999996, "r_x1": 127.287, "r_y1": 190.74199999999996, "r_x2": 127.287, "r_y2": 184.64800000000002, "r_x3": 123.783, "r_y3": 184.64800000000002, "coord_origin": "TOPLEFT"}, "text": "b", "orig": "b", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 129.96, "r_y0": 189.98299999999995, "r_x1": 286.363, "r_y1": 189.98299999999995, "r_x2": 286.363, "r_y2": 181.43100000000004, "r_x3": 129.96, "r_y3": 181.43100000000004, "coord_origin": "TOPLEFT"}, "text": "represent tables in tree structure HTML", "orig": "represent tables in tree structure HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 201.938, "r_x1": 252.781, "r_y1": 201.938, "r_x2": 252.781, "r_y2": 193.38599999999997, "r_x3": 50.112, "r_y3": 193.38599999999997, "coord_origin": "TOPLEFT"}, "text": "format. EditDist denotes the tree-edit distance, and", "orig": "format. EditDist denotes the tree-edit distance, and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 255.182, "r_y0": 201.63199999999995, "r_x1": 257.95, "r_y1": 201.63199999999995, "r_x2": 257.95, "r_y2": 193.06799999999998, "r_x3": 255.182, "r_y3": 193.06799999999998, "coord_origin": "TOPLEFT"}, "text": "|", "orig": "|", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 257.949, "r_y0": 201.774, "r_x1": 263.771, "r_y1": 201.774, "r_x2": 263.771, "r_y2": 193.06799999999998, "r_x3": 257.949, "r_y3": 193.06799999999998, "coord_origin": "TOPLEFT"}, "text": "T", "orig": "T", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 265.155, "r_y0": 201.63199999999995, "r_x1": 267.923, "r_y1": 201.63199999999995, "r_x2": 267.923, "r_y2": 193.06799999999998, "r_x3": 265.155, "r_y3": 193.06799999999998, "coord_origin": "TOPLEFT"}, "text": "|", "orig": "|", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 270.322, "r_y0": 201.938, "r_x1": 286.362, "r_y1": 201.938, "r_x2": 286.362, "r_y2": 193.38599999999997, "r_x3": 270.322, "r_y3": 193.38599999999997, "coord_origin": "TOPLEFT"}, "text": "rep-", "orig": "rep-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 213.89300000000003, "r_x1": 172.134, "r_y1": 213.89300000000003, "r_x2": 172.134, "r_y2": 205.341, "r_x3": 50.112, "r_y3": 205.341, "coord_origin": "TOPLEFT"}, "text": "resents the number of nodes in", "orig": "resents the number of nodes in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 174.624, "r_y0": 213.72900000000004, "r_x1": 180.446, "r_y1": 213.72900000000004, "r_x2": 180.446, "r_y2": 205.02300000000002, "r_x3": 174.624, "r_y3": 205.02300000000002, "coord_origin": "TOPLEFT"}, "text": "T", "orig": "T", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 181.829, "r_y0": 213.89300000000003, "r_x1": 184.32, "r_y1": 213.89300000000003, "r_x2": 184.32, "r_y2": 205.341, "r_x3": 181.829, "r_y3": 205.341, "coord_origin": "TOPLEFT"}, "text": ".", "orig": ".", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "where T a and T b represent tables in tree structure HTML format. EditDist denotes the tree-edit distance, and | T | represents the number of nodes in T ."}, {"label": "section_header", "id": 9, "page_no": 6, "cluster": {"id": 9, "label": "section_header", "bbox": {"l": 50.112, "t": 224.81899999999996, "r": 170.452, "b": 234.67100000000005, "coord_origin": "TOPLEFT"}, "confidence": 0.9588837027549744, "cells": [{"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 234.67100000000005, "r_x1": 170.452, "r_y1": 234.67100000000005, "r_x2": 170.452, "r_y2": 224.81899999999996, "r_x3": 50.112, "r_y3": 224.81899999999996, "coord_origin": "TOPLEFT"}, "text": "5.4. Quantitative Analysis", "orig": "5.4. Quantitative Analysis", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "5.4. Quantitative Analysis"}, {"label": "text", "id": 2, "page_no": 6, "cluster": {"id": 2, "label": "text", "bbox": {"l": 50.112, "t": 243.64999999999998, "r": 286.365, "b": 396.052, "coord_origin": "TOPLEFT"}, "confidence": 0.9855090975761414, "cells": [{"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 252.606, "r_x1": 105.325, "r_y1": 252.606, "r_x2": 105.325, "r_y2": 243.64999999999998, "r_x3": 62.067, "r_y3": 243.64999999999998, "coord_origin": "TOPLEFT"}, "text": "Structure.", "orig": "Structure.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 112.126, "r_y0": 252.59000000000003, "r_x1": 184.684, "r_y1": 252.59000000000003, "r_x2": 184.684, "r_y2": 244.038, "r_x3": 112.126, "r_y3": 244.038, "coord_origin": "TOPLEFT"}, "text": "As shown in Tab.", "orig": "As shown in Tab.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 191.478, "r_y0": 252.59000000000003, "r_x1": 198.95, "r_y1": 252.59000000000003, "r_x2": 198.95, "r_y2": 244.038, "r_x3": 191.478, "r_y3": 244.038, "coord_origin": "TOPLEFT"}, "text": "2,", "orig": "2,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 48, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 202.995, "r_y0": 252.59000000000003, "r_x1": 286.362, "r_y1": 252.59000000000003, "r_x2": 286.362, "r_y2": 244.038, "r_x3": 202.995, "r_y3": 244.038, "coord_origin": "TOPLEFT"}, "text": "TableFormer outper-", "orig": "TableFormer outper-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 49, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 264.54499999999996, "r_x1": 286.365, "r_y1": 264.54499999999996, "r_x2": 286.365, "r_y2": 255.99300000000005, "r_x3": 50.112, "r_y3": 255.99300000000005, "coord_origin": "TOPLEFT"}, "text": "forms all SOTA methods across different datasets by a large", "orig": "forms all SOTA methods across different datasets by a large", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 50, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 276.5, "r_x1": 138.719, "r_y1": 276.5, "r_x2": 138.719, "r_y2": 267.948, "r_x3": 50.112, "r_y3": 267.948, "coord_origin": "TOPLEFT"}, "text": "margin for predicting", "orig": "margin for predicting", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 51, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 142.993, "r_y0": 276.5, "r_x1": 155.168, "r_y1": 276.5, "r_x2": 155.168, "r_y2": 267.948, "r_x3": 142.993, "r_y3": 267.948, "coord_origin": "TOPLEFT"}, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 52, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 159.432, "r_y0": 276.5, "r_x1": 178.799, "r_y1": 276.5, "r_x2": 178.799, "r_y2": 267.948, "r_x3": 159.432, "r_y3": 267.948, "coord_origin": "TOPLEFT"}, "text": "table", "orig": "table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 53, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.073, "r_y0": 276.5, "r_x1": 217.932, "r_y1": 276.5, "r_x2": 217.932, "r_y2": 267.948, "r_x3": 183.073, "r_y3": 267.948, "coord_origin": "TOPLEFT"}, "text": "structure", "orig": "structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 54, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 222.206, "r_y0": 276.5, "r_x1": 286.365, "r_y1": 276.5, "r_x2": 286.365, "r_y2": 267.948, "r_x3": 222.206, "r_y3": 267.948, "coord_origin": "TOPLEFT"}, "text": "from an image.", "orig": "from an image.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 55, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 288.455, "r_x1": 286.365, "r_y1": 288.455, "r_x2": 286.365, "r_y2": 279.903, "r_x3": 50.112, "r_y3": 279.903, "coord_origin": "TOPLEFT"}, "text": "All the more, our model outperforms pre-trained methods.", "orig": "All the more, our model outperforms pre-trained methods.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 56, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 300.411, "r_x1": 286.365, "r_y1": 300.411, "r_x2": 286.365, "r_y2": 291.859, "r_x3": 50.112, "r_y3": 291.859, "coord_origin": "TOPLEFT"}, "text": "During the evaluation we do not apply any table filtering.", "orig": "During the evaluation we do not apply any table filtering.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 57, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 312.366, "r_x1": 286.365, "r_y1": 312.366, "r_x2": 286.365, "r_y2": 303.814, "r_x3": 50.112, "r_y3": 303.814, "coord_origin": "TOPLEFT"}, "text": "We also provide our baseline results on the SynthTabNet", "orig": "We also provide our baseline results on the SynthTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 58, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 324.321, "r_x1": 80.269, "r_y1": 324.321, "r_x2": 80.269, "r_y2": 315.769, "r_x3": 50.112, "r_y3": 315.769, "coord_origin": "TOPLEFT"}, "text": "dataset.", "orig": "dataset.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 59, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 85.579, "r_y0": 324.321, "r_x1": 91.666, "r_y1": 324.321, "r_x2": 91.666, "r_y2": 315.769, "r_x3": 85.579, "r_y3": 315.769, "coord_origin": "TOPLEFT"}, "text": "It", "orig": "It", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 60, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 94.894, "r_y0": 324.321, "r_x1": 257.812, "r_y1": 324.321, "r_x2": 257.812, "r_y2": 315.769, "r_x3": 94.894, "r_y3": 315.769, "coord_origin": "TOPLEFT"}, "text": "has been observed that large tables (e.g.", "orig": "has been observed that large tables (e.g.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 61, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 263.122, "r_y0": 324.321, "r_x1": 286.365, "r_y1": 324.321, "r_x2": 286.365, "r_y2": 315.769, "r_x3": 263.122, "r_y3": 315.769, "coord_origin": "TOPLEFT"}, "text": "tables", "orig": "tables", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 62, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 336.276, "r_x1": 286.365, "r_y1": 336.276, "r_x2": 286.365, "r_y2": 327.724, "r_x3": 50.112, "r_y3": 327.724, "coord_origin": "TOPLEFT"}, "text": "that occupy half of the page or more) yield poor predictions.", "orig": "that occupy half of the page or more) yield poor predictions.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 63, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 348.231, "r_x1": 286.365, "r_y1": 348.231, "r_x2": 286.365, "r_y2": 339.679, "r_x3": 50.112, "r_y3": 339.679, "coord_origin": "TOPLEFT"}, "text": "We attribute this issue to the image resizing during the pre-", "orig": "We attribute this issue to the image resizing during the pre-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 64, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 360.186, "r_x1": 115.068, "r_y1": 360.186, "r_x2": 115.068, "r_y2": 351.634, "r_x3": 50.112, "r_y3": 351.634, "coord_origin": "TOPLEFT"}, "text": "processing step,", "orig": "processing step,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 65, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 119.203, "r_y0": 360.186, "r_x1": 134.147, "r_y1": 360.186, "r_x2": 134.147, "r_y2": 351.634, "r_x3": 119.203, "r_y3": 351.634, "coord_origin": "TOPLEFT"}, "text": "that", "orig": "that", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 66, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 137.952, "r_y0": 360.186, "r_x1": 286.365, "r_y1": 360.186, "r_x2": 286.365, "r_y2": 351.634, "r_x3": 137.952, "r_y3": 351.634, "coord_origin": "TOPLEFT"}, "text": "produces downsampled images with", "orig": "produces downsampled images with", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 67, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 372.142, "r_x1": 155.357, "r_y1": 372.142, "r_x2": 155.357, "r_y2": 363.59, "r_x3": 50.112, "r_y3": 363.59, "coord_origin": "TOPLEFT"}, "text": "indistinguishable features.", "orig": "indistinguishable features.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 68, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.378, "r_y0": 372.142, "r_x1": 286.365, "r_y1": 372.142, "r_x2": 286.365, "r_y2": 363.59, "r_x3": 160.378, "r_y3": 363.59, "coord_origin": "TOPLEFT"}, "text": "This problem can be addressed", "orig": "This problem can be addressed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 69, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 384.097, "r_x1": 286.365, "r_y1": 384.097, "r_x2": 286.365, "r_y2": 375.545, "r_x3": 50.112, "r_y3": 375.545, "coord_origin": "TOPLEFT"}, "text": "by treating such big tables with a separate model which ac-", "orig": "by treating such big tables with a separate model which ac-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 70, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 396.052, "r_x1": 170.012, "r_y1": 396.052, "r_x2": 170.012, "r_y2": 387.5, "r_x3": 50.112, "r_y3": 387.5, "coord_origin": "TOPLEFT"}, "text": "cepts a large input image size.", "orig": "cepts a large input image size.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Structure. As shown in Tab. 2, TableFormer outperforms all SOTA methods across different datasets by a large margin for predicting the table structure from an image. All the more, our model outperforms pre-trained methods. During the evaluation we do not apply any table filtering. We also provide our baseline results on the SynthTabNet dataset. It has been observed that large tables (e.g. tables that occupy half of the page or more) yield poor predictions. We attribute this issue to the image resizing during the preprocessing step, that produces downsampled images with indistinguishable features. This problem can be addressed by treating such big tables with a separate model which accepts a large input image size."}, {"label": "table", "id": 0, "page_no": 6, "cluster": {"id": 0, "label": "table", "bbox": {"l": 53.368526458740234, "t": 409.1357727050781, "r": 283.0443420410156, "b": 582.3977661132812, "coord_origin": "TOPLEFT"}, "confidence": 0.9892510175704956, "cells": [{"index": 71, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 78.843, "r_y0": 429.511, "r_x1": 104.855, "r_y1": 429.511, "r_x2": 104.855, "r_y2": 420.959, "r_x3": 78.843, "r_y3": 420.959, "coord_origin": "TOPLEFT"}, "text": "Model", "orig": "Model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 72, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 211.2, "r_y0": 423.533, "r_x1": 236.107, "r_y1": 423.533, "r_x2": 236.107, "r_y2": 414.981, "r_x3": 211.2, "r_y3": 414.981, "coord_origin": "TOPLEFT"}, "text": "TEDS", "orig": "TEDS", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 73, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 129.338, "r_y0": 435.488, "r_x1": 159.216, "r_y1": 435.488, "r_x2": 159.216, "r_y2": 426.936, "r_x3": 129.338, "r_y3": 426.936, "coord_origin": "TOPLEFT"}, "text": "Dataset", "orig": "Dataset", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 74, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 171.171, "r_y0": 435.488, "r_x1": 199.405, "r_y1": 435.488, "r_x2": 199.405, "r_y2": 426.936, "r_x3": 171.171, "r_y3": 426.936, "coord_origin": "TOPLEFT"}, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 75, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 211.36, "r_y0": 435.488, "r_x1": 247.744, "r_y1": 435.488, "r_x2": 247.744, "r_y2": 426.936, "r_x3": 211.36, "r_y3": 426.936, "coord_origin": "TOPLEFT"}, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 76, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 264.54, "r_y0": 435.488, "r_x1": 277.273, "r_y1": 435.488, "r_x2": 277.273, "r_y2": 426.936, "r_x3": 264.54, "r_y3": 426.936, "coord_origin": "TOPLEFT"}, "text": "All", "orig": "All", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 77, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 81.612, "r_y0": 452.445, "r_x1": 102.085, "r_y1": 452.445, "r_x2": 102.085, "r_y2": 443.893, "r_x3": 81.612, "r_y3": 443.893, "coord_origin": "TOPLEFT"}, "text": "EDD", "orig": "EDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 78, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.872, "r_y0": 452.445, "r_x1": 153.691, "r_y1": 452.445, "r_x2": 153.691, "r_y2": 443.893, "r_x3": 134.872, "r_y3": 443.893, "coord_origin": "TOPLEFT"}, "text": "PTN", "orig": "PTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 79, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 176.566, "r_y0": 452.445, "r_x1": 194.0, "r_y1": 452.445, "r_x2": 194.0, "r_y2": 443.893, "r_x3": 176.566, "r_y3": 443.893, "coord_origin": "TOPLEFT"}, "text": "91.1", "orig": "91.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 80, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 220.829, "r_y0": 452.445, "r_x1": 238.264, "r_y1": 452.445, "r_x2": 238.264, "r_y2": 443.893, "r_x3": 220.829, "r_y3": 443.893, "coord_origin": "TOPLEFT"}, "text": "88.7", "orig": "88.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 81, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 262.184, "r_y0": 452.445, "r_x1": 279.619, "r_y1": 452.445, "r_x2": 279.619, "r_y2": 443.893, "r_x3": 262.184, "r_y3": 443.893, "coord_origin": "TOPLEFT"}, "text": "89.9", "orig": "89.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 82, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 82.165, "r_y0": 464.401, "r_x1": 101.532, "r_y1": 464.401, "r_x2": 101.532, "r_y2": 455.849, "r_x3": 82.165, "r_y3": 455.849, "coord_origin": "TOPLEFT"}, "text": "GTE", "orig": "GTE", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 83, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.867, "r_y0": 464.401, "r_x1": 153.687, "r_y1": 464.401, "r_x2": 153.687, "r_y2": 455.849, "r_x3": 134.867, "r_y3": 455.849, "coord_origin": "TOPLEFT"}, "text": "PTN", "orig": "PTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 84, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.624, "r_y0": 464.401, "r_x1": 186.942, "r_y1": 464.401, "r_x2": 186.942, "r_y2": 455.849, "r_x3": 183.624, "r_y3": 455.849, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 85, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 227.888, "r_y0": 464.401, "r_x1": 231.205, "r_y1": 464.401, "r_x2": 231.205, "r_y2": 455.849, "r_x3": 227.888, "r_y3": 455.849, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 86, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 259.699, "r_y0": 464.401, "r_x1": 282.114, "r_y1": 464.401, "r_x2": 282.114, "r_y2": 455.849, "r_x3": 259.699, "r_y3": 455.849, "coord_origin": "TOPLEFT"}, "text": "93.01", "orig": "93.01", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 87, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 66.315, "r_y0": 476.954, "r_x1": 117.383, "r_y1": 476.954, "r_x2": 117.383, "r_y2": 468.402, "r_x3": 66.315, "r_y3": 468.402, "coord_origin": "TOPLEFT"}, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 88, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.868, "r_y0": 476.954, "r_x1": 153.687, "r_y1": 476.954, "r_x2": 153.687, "r_y2": 468.402, "r_x3": 134.868, "r_y3": 468.402, "coord_origin": "TOPLEFT"}, "text": "PTN", "orig": "PTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 89, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 176.571, "r_y0": 476.954, "r_x1": 194.006, "r_y1": 476.954, "r_x2": 194.006, "r_y2": 468.402, "r_x3": 176.571, "r_y3": 468.402, "coord_origin": "TOPLEFT"}, "text": "98.5", "orig": "98.5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 90, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 220.835, "r_y0": 476.954, "r_x1": 238.269, "r_y1": 476.954, "r_x2": 238.269, "r_y2": 468.402, "r_x3": 220.835, "r_y3": 468.402, "coord_origin": "TOPLEFT"}, "text": "95.0", "orig": "95.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 91, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 259.698, "r_y0": 476.97, "r_x1": 282.114, "r_y1": 476.97, "r_x2": 282.114, "r_y2": 468.014, "r_x3": 259.698, "r_y3": 468.014, "coord_origin": "TOPLEFT"}, "text": "96.75", "orig": "96.75", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 92, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 81.612, "r_y0": 492.147, "r_x1": 102.085, "r_y1": 492.147, "r_x2": 102.085, "r_y2": 483.595, "r_x3": 81.612, "r_y3": 483.595, "coord_origin": "TOPLEFT"}, "text": "EDD", "orig": "EDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 93, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.872, "r_y0": 492.147, "r_x1": 153.691, "r_y1": 492.147, "r_x2": 153.691, "r_y2": 483.595, "r_x3": 134.872, "r_y3": 483.595, "coord_origin": "TOPLEFT"}, "text": "FTN", "orig": "FTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 94, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 176.566, "r_y0": 492.147, "r_x1": 194.0, "r_y1": 492.147, "r_x2": 194.0, "r_y2": 483.595, "r_x3": 176.566, "r_y3": 483.595, "coord_origin": "TOPLEFT"}, "text": "88.4", "orig": "88.4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 95, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 218.339, "r_y0": 492.147, "r_x1": 240.755, "r_y1": 492.147, "r_x2": 240.755, "r_y2": 483.595, "r_x3": 218.339, "r_y3": 483.595, "coord_origin": "TOPLEFT"}, "text": "92.08", "orig": "92.08", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 96, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 262.184, "r_y0": 492.147, "r_x1": 279.619, "r_y1": 492.147, "r_x2": 279.619, "r_y2": 483.595, "r_x3": 262.184, "r_y3": 483.595, "coord_origin": "TOPLEFT"}, "text": "90.6", "orig": "90.6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 97, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 82.165, "r_y0": 504.102, "r_x1": 101.532, "r_y1": 504.102, "r_x2": 101.532, "r_y2": 495.55, "r_x3": 82.165, "r_y3": 495.55, "coord_origin": "TOPLEFT"}, "text": "GTE", "orig": "GTE", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 98, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.867, "r_y0": 504.102, "r_x1": 153.687, "r_y1": 504.102, "r_x2": 153.687, "r_y2": 495.55, "r_x3": 134.867, "r_y3": 495.55, "coord_origin": "TOPLEFT"}, "text": "FTN", "orig": "FTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 99, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.624, "r_y0": 504.102, "r_x1": 186.942, "r_y1": 504.102, "r_x2": 186.942, "r_y2": 495.55, "r_x3": 183.624, "r_y3": 495.55, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 100, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 227.888, "r_y0": 504.102, "r_x1": 231.205, "r_y1": 504.102, "r_x2": 231.205, "r_y2": 495.55, "r_x3": 227.888, "r_y3": 495.55, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 101, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 259.699, "r_y0": 504.102, "r_x1": 282.114, "r_y1": 504.102, "r_x2": 282.114, "r_y2": 495.55, "r_x3": 259.699, "r_y3": 495.55, "coord_origin": "TOPLEFT"}, "text": "87.14", "orig": "87.14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 102, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 71.789, "r_y0": 516.057, "r_x1": 111.908, "r_y1": 516.057, "r_x2": 111.908, "r_y2": 507.505, "r_x3": 71.789, "r_y3": 507.505, "coord_origin": "TOPLEFT"}, "text": "GTE (FT)", "orig": "GTE (FT)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 103, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.862, "r_y0": 516.057, "r_x1": 153.682, "r_y1": 516.057, "r_x2": 153.682, "r_y2": 507.505, "r_x3": 134.862, "r_y3": 507.505, "coord_origin": "TOPLEFT"}, "text": "FTN", "orig": "FTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 104, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.629, "r_y0": 516.057, "r_x1": 186.947, "r_y1": 516.057, "r_x2": 186.947, "r_y2": 507.505, "r_x3": 183.629, "r_y3": 507.505, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 105, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 227.893, "r_y0": 516.057, "r_x1": 231.211, "r_y1": 516.057, "r_x2": 231.211, "r_y2": 507.505, "r_x3": 227.893, "r_y3": 507.505, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 106, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 259.694, "r_y0": 516.057, "r_x1": 282.109, "r_y1": 516.057, "r_x2": 282.109, "r_y2": 507.505, "r_x3": 259.694, "r_y3": 507.505, "coord_origin": "TOPLEFT"}, "text": "91.02", "orig": "91.02", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 107, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 66.315, "r_y0": 528.012, "r_x1": 117.383, "r_y1": 528.012, "r_x2": 117.383, "r_y2": 519.46, "r_x3": 66.315, "r_y3": 519.46, "coord_origin": "TOPLEFT"}, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 108, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.868, "r_y0": 528.012, "r_x1": 153.687, "r_y1": 528.012, "r_x2": 153.687, "r_y2": 519.46, "r_x3": 134.868, "r_y3": 519.46, "coord_origin": "TOPLEFT"}, "text": "FTN", "orig": "FTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 109, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 176.571, "r_y0": 528.012, "r_x1": 194.006, "r_y1": 528.012, "r_x2": 194.006, "r_y2": 519.46, "r_x3": 176.571, "r_y3": 519.46, "coord_origin": "TOPLEFT"}, "text": "97.5", "orig": "97.5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 110, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 220.835, "r_y0": 528.012, "r_x1": 238.269, "r_y1": 528.012, "r_x2": 238.269, "r_y2": 519.46, "r_x3": 220.835, "r_y3": 519.46, "coord_origin": "TOPLEFT"}, "text": "96.0", "orig": "96.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 111, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 262.189, "r_y0": 528.028, "r_x1": 279.624, "r_y1": 528.028, "r_x2": 279.624, "r_y2": 519.072, "r_x3": 262.189, "r_y3": 519.072, "coord_origin": "TOPLEFT"}, "text": "96.8", "orig": "96.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 112, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 81.612, "r_y0": 545.319, "r_x1": 102.085, "r_y1": 545.319, "r_x2": 102.085, "r_y2": 536.767, "r_x3": 81.612, "r_y3": 536.767, "coord_origin": "TOPLEFT"}, "text": "EDD", "orig": "EDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 113, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 137.911, "r_y0": 545.319, "r_x1": 150.643, "r_y1": 545.319, "r_x2": 150.643, "r_y2": 536.767, "r_x3": 137.911, "r_y3": 536.767, "coord_origin": "TOPLEFT"}, "text": "TB", "orig": "TB", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 114, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 176.566, "r_y0": 545.319, "r_x1": 194.0, "r_y1": 545.319, "r_x2": 194.0, "r_y2": 536.767, "r_x3": 176.566, "r_y3": 536.767, "coord_origin": "TOPLEFT"}, "text": "86.0", "orig": "86.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 115, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 227.893, "r_y0": 545.319, "r_x1": 231.21, "r_y1": 545.319, "r_x2": 231.21, "r_y2": 536.767, "r_x3": 227.893, "r_y3": 536.767, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 116, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 262.184, "r_y0": 545.319, "r_x1": 279.619, "r_y1": 545.319, "r_x2": 279.619, "r_y2": 536.767, "r_x3": 262.184, "r_y3": 536.767, "coord_origin": "TOPLEFT"}, "text": "86.0", "orig": "86.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 117, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 66.315, "r_y0": 557.275, "r_x1": 117.383, "r_y1": 557.275, "r_x2": 117.383, "r_y2": 548.723, "r_x3": 66.315, "r_y3": 548.723, "coord_origin": "TOPLEFT"}, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 118, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 137.906, "r_y0": 557.275, "r_x1": 150.638, "r_y1": 557.275, "r_x2": 150.638, "r_y2": 548.723, "r_x3": 137.906, "r_y3": 548.723, "coord_origin": "TOPLEFT"}, "text": "TB", "orig": "TB", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 119, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 176.571, "r_y0": 557.275, "r_x1": 194.006, "r_y1": 557.275, "r_x2": 194.006, "r_y2": 548.723, "r_x3": 176.571, "r_y3": 548.723, "coord_origin": "TOPLEFT"}, "text": "89.6", "orig": "89.6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 120, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 227.888, "r_y0": 557.275, "r_x1": 231.206, "r_y1": 557.275, "r_x2": 231.206, "r_y2": 548.723, "r_x3": 227.888, "r_y3": 548.723, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 121, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 262.189, "r_y0": 557.2909999999999, "r_x1": 279.624, "r_y1": 557.2909999999999, "r_x2": 279.624, "r_y2": 548.335, "r_x3": 262.189, "r_y3": 548.335, "coord_origin": "TOPLEFT"}, "text": "89.6", "orig": "89.6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 122, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 66.315, "r_y0": 576.823, "r_x1": 117.383, "r_y1": 576.823, "r_x2": 117.383, "r_y2": 568.271, "r_x3": 66.315, "r_y3": 568.271, "coord_origin": "TOPLEFT"}, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 123, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.868, "r_y0": 576.823, "r_x1": 153.687, "r_y1": 576.823, "r_x2": 153.687, "r_y2": 568.271, "r_x3": 134.868, "r_y3": 568.271, "coord_origin": "TOPLEFT"}, "text": "STN", "orig": "STN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 124, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 176.571, "r_y0": 576.823, "r_x1": 194.006, "r_y1": 576.823, "r_x2": 194.006, "r_y2": 568.271, "r_x3": 176.571, "r_y3": 568.271, "coord_origin": "TOPLEFT"}, "text": "96.9", "orig": "96.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 125, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 220.835, "r_y0": 576.823, "r_x1": 238.269, "r_y1": 576.823, "r_x2": 238.269, "r_y2": 568.271, "r_x3": 220.835, "r_y3": 568.271, "coord_origin": "TOPLEFT"}, "text": "95.7", "orig": "95.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 126, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 262.19, "r_y0": 576.823, "r_x1": 279.624, "r_y1": 576.823, "r_x2": 279.624, "r_y2": 568.271, "r_x3": 262.19, "r_y3": 568.271, "coord_origin": "TOPLEFT"}, "text": "96.7", "orig": "96.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": [{"id": 27, "label": "text", "bbox": {"l": 78.843, "t": 420.959, "r": 104.855, "b": 429.511, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 71, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 78.843, "r_y0": 429.511, "r_x1": 104.855, "r_y1": 429.511, "r_x2": 104.855, "r_y2": 420.959, "r_x3": 78.843, "r_y3": 420.959, "coord_origin": "TOPLEFT"}, "text": "Model", "orig": "Model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 28, "label": "text", "bbox": {"l": 211.2, "t": 414.981, "r": 236.107, "b": 423.533, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 72, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 211.2, "r_y0": 423.533, "r_x1": 236.107, "r_y1": 423.533, "r_x2": 236.107, "r_y2": 414.981, "r_x3": 211.2, "r_y3": 414.981, "coord_origin": "TOPLEFT"}, "text": "TEDS", "orig": "TEDS", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 29, "label": "text", "bbox": {"l": 129.338, "t": 426.936, "r": 159.216, "b": 435.488, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 73, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 129.338, "r_y0": 435.488, "r_x1": 159.216, "r_y1": 435.488, "r_x2": 159.216, "r_y2": 426.936, "r_x3": 129.338, "r_y3": 426.936, "coord_origin": "TOPLEFT"}, "text": "Dataset", "orig": "Dataset", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 30, "label": "text", "bbox": {"l": 171.171, "t": 426.936, "r": 199.405, "b": 435.488, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 74, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 171.171, "r_y0": 435.488, "r_x1": 199.405, "r_y1": 435.488, "r_x2": 199.405, "r_y2": 426.936, "r_x3": 171.171, "r_y3": 426.936, "coord_origin": "TOPLEFT"}, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 31, "label": "text", "bbox": {"l": 211.36, "t": 426.936, "r": 247.744, "b": 435.488, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 75, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 211.36, "r_y0": 435.488, "r_x1": 247.744, "r_y1": 435.488, "r_x2": 247.744, "r_y2": 426.936, "r_x3": 211.36, "r_y3": 426.936, "coord_origin": "TOPLEFT"}, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 32, "label": "text", "bbox": {"l": 264.54, "t": 426.936, "r": 277.273, "b": 435.488, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 76, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 264.54, "r_y0": 435.488, "r_x1": 277.273, "r_y1": 435.488, "r_x2": 277.273, "r_y2": 426.936, "r_x3": 264.54, "r_y3": 426.936, "coord_origin": "TOPLEFT"}, "text": "All", "orig": "All", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 33, "label": "text", "bbox": {"l": 81.612, "t": 443.893, "r": 102.085, "b": 452.445, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 77, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 81.612, "r_y0": 452.445, "r_x1": 102.085, "r_y1": 452.445, "r_x2": 102.085, "r_y2": 443.893, "r_x3": 81.612, "r_y3": 443.893, "coord_origin": "TOPLEFT"}, "text": "EDD", "orig": "EDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 34, "label": "text", "bbox": {"l": 134.872, "t": 443.893, "r": 153.691, "b": 452.445, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 78, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.872, "r_y0": 452.445, "r_x1": 153.691, "r_y1": 452.445, "r_x2": 153.691, "r_y2": 443.893, "r_x3": 134.872, "r_y3": 443.893, "coord_origin": "TOPLEFT"}, "text": "PTN", "orig": "PTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 35, "label": "text", "bbox": {"l": 176.566, "t": 443.893, "r": 194.0, "b": 452.445, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 79, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 176.566, "r_y0": 452.445, "r_x1": 194.0, "r_y1": 452.445, "r_x2": 194.0, "r_y2": 443.893, "r_x3": 176.566, "r_y3": 443.893, "coord_origin": "TOPLEFT"}, "text": "91.1", "orig": "91.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 36, "label": "text", "bbox": {"l": 220.829, "t": 443.893, "r": 238.264, "b": 452.445, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 80, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 220.829, "r_y0": 452.445, "r_x1": 238.264, "r_y1": 452.445, "r_x2": 238.264, "r_y2": 443.893, "r_x3": 220.829, "r_y3": 443.893, "coord_origin": "TOPLEFT"}, "text": "88.7", "orig": "88.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 37, "label": "text", "bbox": {"l": 262.184, "t": 443.893, "r": 279.619, "b": 452.445, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 81, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 262.184, "r_y0": 452.445, "r_x1": 279.619, "r_y1": 452.445, "r_x2": 279.619, "r_y2": 443.893, "r_x3": 262.184, "r_y3": 443.893, "coord_origin": "TOPLEFT"}, "text": "89.9", "orig": "89.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 38, "label": "text", "bbox": {"l": 82.165, "t": 455.849, "r": 101.532, "b": 464.401, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 82, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 82.165, "r_y0": 464.401, "r_x1": 101.532, "r_y1": 464.401, "r_x2": 101.532, "r_y2": 455.849, "r_x3": 82.165, "r_y3": 455.849, "coord_origin": "TOPLEFT"}, "text": "GTE", "orig": "GTE", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 39, "label": "text", "bbox": {"l": 134.867, "t": 455.849, "r": 153.687, "b": 464.401, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 83, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.867, "r_y0": 464.401, "r_x1": 153.687, "r_y1": 464.401, "r_x2": 153.687, "r_y2": 455.849, "r_x3": 134.867, "r_y3": 455.849, "coord_origin": "TOPLEFT"}, "text": "PTN", "orig": "PTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 40, "label": "text", "bbox": {"l": 183.624, "t": 455.849, "r": 186.942, "b": 464.401, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 84, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.624, "r_y0": 464.401, "r_x1": 186.942, "r_y1": 464.401, "r_x2": 186.942, "r_y2": 455.849, "r_x3": 183.624, "r_y3": 455.849, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 41, "label": "text", "bbox": {"l": 227.888, "t": 455.849, "r": 231.205, "b": 464.401, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 85, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 227.888, "r_y0": 464.401, "r_x1": 231.205, "r_y1": 464.401, "r_x2": 231.205, "r_y2": 455.849, "r_x3": 227.888, "r_y3": 455.849, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 42, "label": "text", "bbox": {"l": 259.699, "t": 455.849, "r": 282.114, "b": 464.401, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 86, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 259.699, "r_y0": 464.401, "r_x1": 282.114, "r_y1": 464.401, "r_x2": 282.114, "r_y2": 455.849, "r_x3": 259.699, "r_y3": 455.849, "coord_origin": "TOPLEFT"}, "text": "93.01", "orig": "93.01", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 43, "label": "text", "bbox": {"l": 66.315, "t": 468.402, "r": 117.383, "b": 476.954, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 87, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 66.315, "r_y0": 476.954, "r_x1": 117.383, "r_y1": 476.954, "r_x2": 117.383, "r_y2": 468.402, "r_x3": 66.315, "r_y3": 468.402, "coord_origin": "TOPLEFT"}, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 44, "label": "text", "bbox": {"l": 134.868, "t": 468.402, "r": 153.687, "b": 476.954, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 88, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.868, "r_y0": 476.954, "r_x1": 153.687, "r_y1": 476.954, "r_x2": 153.687, "r_y2": 468.402, "r_x3": 134.868, "r_y3": 468.402, "coord_origin": "TOPLEFT"}, "text": "PTN", "orig": "PTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 45, "label": "text", "bbox": {"l": 176.571, "t": 468.402, "r": 194.006, "b": 476.954, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 89, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 176.571, "r_y0": 476.954, "r_x1": 194.006, "r_y1": 476.954, "r_x2": 194.006, "r_y2": 468.402, "r_x3": 176.571, "r_y3": 468.402, "coord_origin": "TOPLEFT"}, "text": "98.5", "orig": "98.5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 46, "label": "text", "bbox": {"l": 220.835, "t": 468.402, "r": 238.269, "b": 476.954, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 90, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 220.835, "r_y0": 476.954, "r_x1": 238.269, "r_y1": 476.954, "r_x2": 238.269, "r_y2": 468.402, "r_x3": 220.835, "r_y3": 468.402, "coord_origin": "TOPLEFT"}, "text": "95.0", "orig": "95.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 47, "label": "text", "bbox": {"l": 259.698, "t": 468.014, "r": 282.114, "b": 476.97, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 91, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 259.698, "r_y0": 476.97, "r_x1": 282.114, "r_y1": 476.97, "r_x2": 282.114, "r_y2": 468.014, "r_x3": 259.698, "r_y3": 468.014, "coord_origin": "TOPLEFT"}, "text": "96.75", "orig": "96.75", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 48, "label": "text", "bbox": {"l": 81.612, "t": 483.595, "r": 102.085, "b": 492.147, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 92, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 81.612, "r_y0": 492.147, "r_x1": 102.085, "r_y1": 492.147, "r_x2": 102.085, "r_y2": 483.595, "r_x3": 81.612, "r_y3": 483.595, "coord_origin": "TOPLEFT"}, "text": "EDD", "orig": "EDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 49, "label": "text", "bbox": {"l": 134.872, "t": 483.595, "r": 153.691, "b": 492.147, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 93, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.872, "r_y0": 492.147, "r_x1": 153.691, "r_y1": 492.147, "r_x2": 153.691, "r_y2": 483.595, "r_x3": 134.872, "r_y3": 483.595, "coord_origin": "TOPLEFT"}, "text": "FTN", "orig": "FTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 50, "label": "text", "bbox": {"l": 176.566, "t": 483.595, "r": 194.0, "b": 492.147, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 94, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 176.566, "r_y0": 492.147, "r_x1": 194.0, "r_y1": 492.147, "r_x2": 194.0, "r_y2": 483.595, "r_x3": 176.566, "r_y3": 483.595, "coord_origin": "TOPLEFT"}, "text": "88.4", "orig": "88.4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 51, "label": "text", "bbox": {"l": 218.339, "t": 483.595, "r": 240.755, "b": 492.147, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 95, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 218.339, "r_y0": 492.147, "r_x1": 240.755, "r_y1": 492.147, "r_x2": 240.755, "r_y2": 483.595, "r_x3": 218.339, "r_y3": 483.595, "coord_origin": "TOPLEFT"}, "text": "92.08", "orig": "92.08", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 52, "label": "text", "bbox": {"l": 262.184, "t": 483.595, "r": 279.619, "b": 492.147, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 96, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 262.184, "r_y0": 492.147, "r_x1": 279.619, "r_y1": 492.147, "r_x2": 279.619, "r_y2": 483.595, "r_x3": 262.184, "r_y3": 483.595, "coord_origin": "TOPLEFT"}, "text": "90.6", "orig": "90.6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 53, "label": "text", "bbox": {"l": 82.165, "t": 495.55, "r": 101.532, "b": 504.102, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 97, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 82.165, "r_y0": 504.102, "r_x1": 101.532, "r_y1": 504.102, "r_x2": 101.532, "r_y2": 495.55, "r_x3": 82.165, "r_y3": 495.55, "coord_origin": "TOPLEFT"}, "text": "GTE", "orig": "GTE", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 54, "label": "text", "bbox": {"l": 134.867, "t": 495.55, "r": 153.687, "b": 504.102, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 98, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.867, "r_y0": 504.102, "r_x1": 153.687, "r_y1": 504.102, "r_x2": 153.687, "r_y2": 495.55, "r_x3": 134.867, "r_y3": 495.55, "coord_origin": "TOPLEFT"}, "text": "FTN", "orig": "FTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 55, "label": "text", "bbox": {"l": 183.624, "t": 495.55, "r": 186.942, "b": 504.102, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 99, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.624, "r_y0": 504.102, "r_x1": 186.942, "r_y1": 504.102, "r_x2": 186.942, "r_y2": 495.55, "r_x3": 183.624, "r_y3": 495.55, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 56, "label": "text", "bbox": {"l": 227.888, "t": 495.55, "r": 231.205, "b": 504.102, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 100, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 227.888, "r_y0": 504.102, "r_x1": 231.205, "r_y1": 504.102, "r_x2": 231.205, "r_y2": 495.55, "r_x3": 227.888, "r_y3": 495.55, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 57, "label": "text", "bbox": {"l": 259.699, "t": 495.55, "r": 282.114, "b": 504.102, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 101, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 259.699, "r_y0": 504.102, "r_x1": 282.114, "r_y1": 504.102, "r_x2": 282.114, "r_y2": 495.55, "r_x3": 259.699, "r_y3": 495.55, "coord_origin": "TOPLEFT"}, "text": "87.14", "orig": "87.14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 58, "label": "text", "bbox": {"l": 71.789, "t": 507.505, "r": 111.908, "b": 516.057, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 102, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 71.789, "r_y0": 516.057, "r_x1": 111.908, "r_y1": 516.057, "r_x2": 111.908, "r_y2": 507.505, "r_x3": 71.789, "r_y3": 507.505, "coord_origin": "TOPLEFT"}, "text": "GTE (FT)", "orig": "GTE (FT)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 59, "label": "text", "bbox": {"l": 134.862, "t": 507.505, "r": 153.682, "b": 516.057, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 103, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.862, "r_y0": 516.057, "r_x1": 153.682, "r_y1": 516.057, "r_x2": 153.682, "r_y2": 507.505, "r_x3": 134.862, "r_y3": 507.505, "coord_origin": "TOPLEFT"}, "text": "FTN", "orig": "FTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 60, "label": "text", "bbox": {"l": 183.629, "t": 507.505, "r": 186.947, "b": 516.057, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 104, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.629, "r_y0": 516.057, "r_x1": 186.947, "r_y1": 516.057, "r_x2": 186.947, "r_y2": 507.505, "r_x3": 183.629, "r_y3": 507.505, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 61, "label": "text", "bbox": {"l": 227.893, "t": 507.505, "r": 231.211, "b": 516.057, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 105, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 227.893, "r_y0": 516.057, "r_x1": 231.211, "r_y1": 516.057, "r_x2": 231.211, "r_y2": 507.505, "r_x3": 227.893, "r_y3": 507.505, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 62, "label": "text", "bbox": {"l": 259.694, "t": 507.505, "r": 282.109, "b": 516.057, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 106, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 259.694, "r_y0": 516.057, "r_x1": 282.109, "r_y1": 516.057, "r_x2": 282.109, "r_y2": 507.505, "r_x3": 259.694, "r_y3": 507.505, "coord_origin": "TOPLEFT"}, "text": "91.02", "orig": "91.02", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 63, "label": "text", "bbox": {"l": 66.315, "t": 519.46, "r": 117.383, "b": 528.012, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 107, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 66.315, "r_y0": 528.012, "r_x1": 117.383, "r_y1": 528.012, "r_x2": 117.383, "r_y2": 519.46, "r_x3": 66.315, "r_y3": 519.46, "coord_origin": "TOPLEFT"}, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 64, "label": "text", "bbox": {"l": 134.868, "t": 519.46, "r": 153.687, "b": 528.012, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 108, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.868, "r_y0": 528.012, "r_x1": 153.687, "r_y1": 528.012, "r_x2": 153.687, "r_y2": 519.46, "r_x3": 134.868, "r_y3": 519.46, "coord_origin": "TOPLEFT"}, "text": "FTN", "orig": "FTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 65, "label": "text", "bbox": {"l": 176.571, "t": 519.46, "r": 194.006, "b": 528.012, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 109, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 176.571, "r_y0": 528.012, "r_x1": 194.006, "r_y1": 528.012, "r_x2": 194.006, "r_y2": 519.46, "r_x3": 176.571, "r_y3": 519.46, "coord_origin": "TOPLEFT"}, "text": "97.5", "orig": "97.5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 66, "label": "text", "bbox": {"l": 220.835, "t": 519.46, "r": 238.269, "b": 528.012, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 110, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 220.835, "r_y0": 528.012, "r_x1": 238.269, "r_y1": 528.012, "r_x2": 238.269, "r_y2": 519.46, "r_x3": 220.835, "r_y3": 519.46, "coord_origin": "TOPLEFT"}, "text": "96.0", "orig": "96.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 67, "label": "text", "bbox": {"l": 262.189, "t": 519.072, "r": 279.624, "b": 528.028, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 111, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 262.189, "r_y0": 528.028, "r_x1": 279.624, "r_y1": 528.028, "r_x2": 279.624, "r_y2": 519.072, "r_x3": 262.189, "r_y3": 519.072, "coord_origin": "TOPLEFT"}, "text": "96.8", "orig": "96.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 68, "label": "text", "bbox": {"l": 81.612, "t": 536.767, "r": 102.085, "b": 545.319, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 112, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 81.612, "r_y0": 545.319, "r_x1": 102.085, "r_y1": 545.319, "r_x2": 102.085, "r_y2": 536.767, "r_x3": 81.612, "r_y3": 536.767, "coord_origin": "TOPLEFT"}, "text": "EDD", "orig": "EDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 69, "label": "text", "bbox": {"l": 137.911, "t": 536.767, "r": 150.643, "b": 545.319, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 113, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 137.911, "r_y0": 545.319, "r_x1": 150.643, "r_y1": 545.319, "r_x2": 150.643, "r_y2": 536.767, "r_x3": 137.911, "r_y3": 536.767, "coord_origin": "TOPLEFT"}, "text": "TB", "orig": "TB", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 70, "label": "text", "bbox": {"l": 176.566, "t": 536.767, "r": 194.0, "b": 545.319, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 114, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 176.566, "r_y0": 545.319, "r_x1": 194.0, "r_y1": 545.319, "r_x2": 194.0, "r_y2": 536.767, "r_x3": 176.566, "r_y3": 536.767, "coord_origin": "TOPLEFT"}, "text": "86.0", "orig": "86.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 71, "label": "text", "bbox": {"l": 227.893, "t": 536.767, "r": 231.21, "b": 545.319, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 115, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 227.893, "r_y0": 545.319, "r_x1": 231.21, "r_y1": 545.319, "r_x2": 231.21, "r_y2": 536.767, "r_x3": 227.893, "r_y3": 536.767, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 72, "label": "text", "bbox": {"l": 262.184, "t": 536.767, "r": 279.619, "b": 545.319, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 116, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 262.184, "r_y0": 545.319, "r_x1": 279.619, "r_y1": 545.319, "r_x2": 279.619, "r_y2": 536.767, "r_x3": 262.184, "r_y3": 536.767, "coord_origin": "TOPLEFT"}, "text": "86.0", "orig": "86.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 73, "label": "text", "bbox": {"l": 66.315, "t": 548.723, "r": 117.383, "b": 557.275, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 117, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 66.315, "r_y0": 557.275, "r_x1": 117.383, "r_y1": 557.275, "r_x2": 117.383, "r_y2": 548.723, "r_x3": 66.315, "r_y3": 548.723, "coord_origin": "TOPLEFT"}, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 74, "label": "text", "bbox": {"l": 137.906, "t": 548.723, "r": 150.638, "b": 557.275, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 118, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 137.906, "r_y0": 557.275, "r_x1": 150.638, "r_y1": 557.275, "r_x2": 150.638, "r_y2": 548.723, "r_x3": 137.906, "r_y3": 548.723, "coord_origin": "TOPLEFT"}, "text": "TB", "orig": "TB", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 75, "label": "text", "bbox": {"l": 176.571, "t": 548.723, "r": 194.006, "b": 557.275, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 119, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 176.571, "r_y0": 557.275, "r_x1": 194.006, "r_y1": 557.275, "r_x2": 194.006, "r_y2": 548.723, "r_x3": 176.571, "r_y3": 548.723, "coord_origin": "TOPLEFT"}, "text": "89.6", "orig": "89.6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 76, "label": "text", "bbox": {"l": 227.888, "t": 548.723, "r": 231.206, "b": 557.275, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 120, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 227.888, "r_y0": 557.275, "r_x1": 231.206, "r_y1": 557.275, "r_x2": 231.206, "r_y2": 548.723, "r_x3": 227.888, "r_y3": 548.723, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 77, "label": "text", "bbox": {"l": 262.189, "t": 548.335, "r": 279.624, "b": 557.2909999999999, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 121, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 262.189, "r_y0": 557.2909999999999, "r_x1": 279.624, "r_y1": 557.2909999999999, "r_x2": 279.624, "r_y2": 548.335, "r_x3": 262.189, "r_y3": 548.335, "coord_origin": "TOPLEFT"}, "text": "89.6", "orig": "89.6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 78, "label": "text", "bbox": {"l": 66.315, "t": 568.271, "r": 117.383, "b": 576.823, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 122, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 66.315, "r_y0": 576.823, "r_x1": 117.383, "r_y1": 576.823, "r_x2": 117.383, "r_y2": 568.271, "r_x3": 66.315, "r_y3": 568.271, "coord_origin": "TOPLEFT"}, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 79, "label": "text", "bbox": {"l": 134.868, "t": 568.271, "r": 153.687, "b": 576.823, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 123, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.868, "r_y0": 576.823, "r_x1": 153.687, "r_y1": 576.823, "r_x2": 153.687, "r_y2": 568.271, "r_x3": 134.868, "r_y3": 568.271, "coord_origin": "TOPLEFT"}, "text": "STN", "orig": "STN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 80, "label": "text", "bbox": {"l": 176.571, "t": 568.271, "r": 194.006, "b": 576.823, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 124, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 176.571, "r_y0": 576.823, "r_x1": 194.006, "r_y1": 576.823, "r_x2": 194.006, "r_y2": 568.271, "r_x3": 176.571, "r_y3": 568.271, "coord_origin": "TOPLEFT"}, "text": "96.9", "orig": "96.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 81, "label": "text", "bbox": {"l": 220.835, "t": 568.271, "r": 238.269, "b": 576.823, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 125, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 220.835, "r_y0": 576.823, "r_x1": 238.269, "r_y1": 576.823, "r_x2": 238.269, "r_y2": 568.271, "r_x3": 220.835, "r_y3": 568.271, "coord_origin": "TOPLEFT"}, "text": "95.7", "orig": "95.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 82, "label": "text", "bbox": {"l": 262.19, "t": 568.271, "r": 279.624, "b": 576.823, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 126, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 262.19, "r_y0": 576.823, "r_x1": 279.624, "r_y1": 576.823, "r_x2": 279.624, "r_y2": 568.271, "r_x3": 262.19, "r_y3": 568.271, "coord_origin": "TOPLEFT"}, "text": "96.7", "orig": "96.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}]}, "text": null, "otsl_seq": ["ched", "ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 11, "num_cols": 5, "table_cells": [{"bbox": {"l": 78.843, "t": 420.959, "r": 104.855, "b": 429.511, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Model", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 211.2, "t": 414.981, "r": 247.744, "b": 435.488, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "TEDS Complex", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 129.338, "t": 426.936, "r": 159.216, "b": 435.488, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "Dataset", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 171.171, "t": 426.936, "r": 199.405, "b": 435.488, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "Simple", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 264.54, "t": 426.936, "r": 277.273, "b": 435.488, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "All", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 81.612, "t": 443.893, "r": 102.085, "b": 452.445, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "EDD", "column_header": false, "row_header": true, "row_section": false}, {"bbox": {"l": 134.872, "t": 443.893, "r": 153.691, "b": 452.445, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "PTN", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 176.566, "t": 443.893, "r": 194.0, "b": 452.445, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "91.1", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 220.829, "t": 443.893, "r": 238.264, "b": 452.445, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "88.7", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 262.184, "t": 443.893, "r": 279.619, "b": 452.445, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "89.9", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 82.165, "t": 455.849, "r": 101.532, "b": 464.401, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "GTE", "column_header": false, "row_header": true, "row_section": false}, {"bbox": {"l": 134.867, "t": 455.849, "r": 153.687, "b": 464.401, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "PTN", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 183.624, "t": 455.849, "r": 186.942, "b": 464.401, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "-", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 227.888, "t": 455.849, "r": 231.205, "b": 464.401, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "-", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 259.699, "t": 455.849, "r": 282.114, "b": 464.401, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "93.01", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 66.315, "t": 468.402, "r": 117.383, "b": 476.954, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "TableFormer", "column_header": false, "row_header": true, "row_section": false}, {"bbox": {"l": 134.868, "t": 468.402, "r": 153.687, "b": 476.954, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "PTN", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 176.571, "t": 468.402, "r": 194.006, "b": 476.954, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "98.5", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 220.835, "t": 468.402, "r": 238.269, "b": 476.954, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "95.0", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 259.698, "t": 468.014, "r": 282.114, "b": 476.97, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "96.75", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 81.612, "t": 483.595, "r": 102.085, "b": 492.147, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "EDD", "column_header": false, "row_header": true, "row_section": false}, {"bbox": {"l": 134.872, "t": 483.595, "r": 153.691, "b": 492.147, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "FTN", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 176.566, "t": 483.595, "r": 194.0, "b": 492.147, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "88.4", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 218.339, "t": 483.595, "r": 240.755, "b": 492.147, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "92.08", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 262.184, "t": 483.595, "r": 279.619, "b": 492.147, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "90.6", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 82.165, "t": 495.55, "r": 101.532, "b": 504.102, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "GTE", "column_header": false, "row_header": true, "row_section": false}, {"bbox": {"l": 134.867, "t": 495.55, "r": 153.687, "b": 504.102, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "FTN", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 183.624, "t": 495.55, "r": 186.942, "b": 504.102, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "-", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 227.888, "t": 495.55, "r": 231.205, "b": 504.102, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "-", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 259.699, "t": 495.55, "r": 282.114, "b": 504.102, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "87.14", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 71.789, "t": 507.505, "r": 111.908, "b": 516.057, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "GTE (FT)", "column_header": false, "row_header": true, "row_section": false}, {"bbox": {"l": 134.862, "t": 507.505, "r": 153.682, "b": 516.057, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "FTN", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 183.629, "t": 507.505, "r": 186.947, "b": 516.057, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "-", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 227.893, "t": 507.505, "r": 231.211, "b": 516.057, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "-", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 259.694, "t": 507.505, "r": 282.109, "b": 516.057, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "91.02", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 66.315, "t": 519.46, "r": 117.383, "b": 528.012, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 7, "end_row_offset_idx": 8, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "TableFormer", "column_header": false, "row_header": true, "row_section": false}, {"bbox": {"l": 134.868, "t": 519.46, "r": 153.687, "b": 528.012, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 7, "end_row_offset_idx": 8, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "FTN", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 176.571, "t": 519.46, "r": 194.006, "b": 528.012, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 7, "end_row_offset_idx": 8, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "97.5", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 220.835, "t": 519.46, "r": 238.269, "b": 528.012, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 7, "end_row_offset_idx": 8, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "96.0", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 262.189, "t": 519.072, "r": 279.624, "b": 528.028, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 7, "end_row_offset_idx": 8, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "96.8", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 81.612, "t": 536.767, "r": 102.085, "b": 545.319, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 8, "end_row_offset_idx": 9, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "EDD", "column_header": false, "row_header": true, "row_section": false}, {"bbox": {"l": 137.911, "t": 536.767, "r": 150.643, "b": 545.319, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 8, "end_row_offset_idx": 9, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "TB", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 176.566, "t": 536.767, "r": 194.0, "b": 545.319, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 8, "end_row_offset_idx": 9, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "86.0", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 227.893, "t": 536.767, "r": 231.21, "b": 545.319, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 8, "end_row_offset_idx": 9, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "-", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 262.184, "t": 536.767, "r": 279.619, "b": 545.319, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 8, "end_row_offset_idx": 9, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "86.0", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 66.315, "t": 548.723, "r": 117.383, "b": 557.275, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 9, "end_row_offset_idx": 10, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "TableFormer", "column_header": false, "row_header": true, "row_section": false}, {"bbox": {"l": 137.906, "t": 548.723, "r": 150.638, "b": 557.275, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 9, "end_row_offset_idx": 10, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "TB", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 176.571, "t": 548.723, "r": 194.006, "b": 557.275, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 9, "end_row_offset_idx": 10, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "89.6", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 227.888, "t": 548.723, "r": 231.206, "b": 557.275, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 9, "end_row_offset_idx": 10, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "-", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 262.189, "t": 548.335, "r": 279.624, "b": 557.2909999999999, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 9, "end_row_offset_idx": 10, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "89.6", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 66.315, "t": 568.271, "r": 117.383, "b": 576.823, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 10, "end_row_offset_idx": 11, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "TableFormer", "column_header": false, "row_header": true, "row_section": false}, {"bbox": {"l": 134.868, "t": 568.271, "r": 153.687, "b": 576.823, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 10, "end_row_offset_idx": 11, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "STN", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 176.571, "t": 568.271, "r": 194.006, "b": 576.823, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 10, "end_row_offset_idx": 11, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "96.9", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 220.835, "t": 568.271, "r": 238.269, "b": 576.823, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 10, "end_row_offset_idx": 11, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "95.7", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 262.19, "t": 568.271, "r": 279.624, "b": 576.823, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 10, "end_row_offset_idx": 11, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "96.7", "column_header": false, "row_header": false, "row_section": false}]}, {"label": "text", "id": 15, "page_no": 6, "cluster": {"id": 15, "label": "text", "bbox": {"l": 50.112, "t": 592.702, "r": 286.365, "b": 613.2090000000001, "coord_origin": "TOPLEFT"}, "confidence": 0.7209173440933228, "cells": [{"index": 127, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 601.254, "r_x1": 82.062, "r_y1": 601.254, "r_x2": 82.062, "r_y2": 592.702, "r_x3": 50.112, "r_y3": 592.702, "coord_origin": "TOPLEFT"}, "text": "Table 2:", "orig": "Table 2:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 128, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 87.382, "r_y0": 601.254, "r_x1": 286.365, "r_y1": 601.254, "r_x2": 286.365, "r_y2": 592.702, "r_x3": 87.382, "r_y3": 592.702, "coord_origin": "TOPLEFT"}, "text": "Structure results on PubTabNet (PTN), FinTabNet", "orig": "Structure results on PubTabNet (PTN), FinTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 129, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 613.2090000000001, "r_x1": 247.461, "r_y1": 613.2090000000001, "r_x2": 247.461, "r_y2": 604.657, "r_x3": 50.112, "r_y3": 604.657, "coord_origin": "TOPLEFT"}, "text": "(FTN), TableBank (TB) and SynthTabNet (STN).", "orig": "(FTN), TableBank (TB) and SynthTabNet (STN).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Table 2: Structure results on PubTabNet (PTN), FinTabNet (FTN), TableBank (TB) and SynthTabNet (STN)."}, {"label": "text", "id": 16, "page_no": 6, "cluster": {"id": 16, "label": "text", "bbox": {"l": 50.112, "t": 616.612, "r": 261.787, "b": 625.164, "coord_origin": "TOPLEFT"}, "confidence": 0.6433312892913818, "cells": [{"index": 130, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 625.164, "r_x1": 261.787, "r_y1": 625.164, "r_x2": 261.787, "r_y2": 616.612, "r_x3": 50.112, "r_y3": 616.612, "coord_origin": "TOPLEFT"}, "text": "FT: Model was trained on PubTabNet then finetuned.", "orig": "FT: Model was trained on PubTabNet then finetuned.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "FT: Model was trained on PubTabNet then finetuned."}, {"label": "text", "id": 3, "page_no": 6, "cluster": {"id": 3, "label": "text", "bbox": {"l": 50.112, "t": 644.35, "r": 286.366, "b": 713.066, "coord_origin": "TOPLEFT"}, "confidence": 0.9854635000228882, "cells": [{"index": 131, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 653.306, "r_x1": 124.722, "r_y1": 653.306, "r_x2": 124.722, "r_y2": 644.35, "r_x3": 62.067, "r_y3": 644.35, "coord_origin": "TOPLEFT"}, "text": "Cell Detection.", "orig": "Cell Detection.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 132, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 128.204, "r_y0": 653.29, "r_x1": 242.933, "r_y1": 653.29, "r_x2": 242.933, "r_y2": 644.738, "r_x3": 128.204, "r_y3": 644.738, "coord_origin": "TOPLEFT"}, "text": "Like any object detector, our", "orig": "Like any object detector, our", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 133, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 245.554, "r_y0": 653.1469999999999, "r_x1": 286.361, "r_y1": 653.1469999999999, "r_x2": 286.361, "r_y2": 644.559, "r_x3": 245.554, "r_y3": 644.559, "coord_origin": "TOPLEFT"}, "text": "Cell BBox", "orig": "Cell BBox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 134, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 665.102, "r_x1": 84.971, "r_y1": 665.102, "r_x2": 84.971, "r_y2": 656.514, "r_x3": 50.112, "r_y3": 656.514, "coord_origin": "TOPLEFT"}, "text": "Detector", "orig": "Detector", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 135, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 89.515, "r_y0": 665.245, "r_x1": 123.677, "r_y1": 665.245, "r_x2": 123.677, "r_y2": 656.693, "r_x3": 89.515, "r_y3": 656.693, "coord_origin": "TOPLEFT"}, "text": "provides", "orig": "provides", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 136, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 127.991, "r_y0": 665.245, "r_x1": 286.366, "r_y1": 665.245, "r_x2": 286.366, "r_y2": 656.693, "r_x3": 127.991, "r_y3": 656.693, "coord_origin": "TOPLEFT"}, "text": "bounding boxes that can be improved", "orig": "bounding boxes that can be improved", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 137, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 677.2, "r_x1": 286.365, "r_y1": 677.2, "r_x2": 286.365, "r_y2": 668.648, "r_x3": 50.112, "r_y3": 668.648, "coord_origin": "TOPLEFT"}, "text": "with post-processing during inference. We make use of the", "orig": "with post-processing during inference. We make use of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 138, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 689.156, "r_x1": 259.655, "r_y1": 689.156, "r_x2": 259.655, "r_y2": 680.604, "r_x3": 50.112, "r_y3": 680.604, "coord_origin": "TOPLEFT"}, "text": "grid-like structure of tables to refine the predictions.", "orig": "grid-like structure of tables to refine the predictions.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 139, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 263.65, "r_y0": 689.156, "r_x1": 286.365, "r_y1": 689.156, "r_x2": 286.365, "r_y2": 680.604, "r_x3": 263.65, "r_y3": 680.604, "coord_origin": "TOPLEFT"}, "text": "A de-", "orig": "A de-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 140, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 701.111, "r_x1": 286.365, "r_y1": 701.111, "r_x2": 286.365, "r_y2": 692.559, "r_x3": 50.112, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "tailed explanation on the post-processing is available in the", "orig": "tailed explanation on the post-processing is available in the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 141, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 713.066, "r_x1": 147.068, "r_y1": 713.066, "r_x2": 147.068, "r_y2": 704.514, "r_x3": 50.112, "r_y3": 704.514, "coord_origin": "TOPLEFT"}, "text": "supplementary material.", "orig": "supplementary material.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 142, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 152.159, "r_y0": 713.066, "r_x1": 223.003, "r_y1": 713.066, "r_x2": 223.003, "r_y2": 704.514, "r_x3": 152.159, "r_y3": 704.514, "coord_origin": "TOPLEFT"}, "text": "As shown in Tab.", "orig": "As shown in Tab.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 143, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 228.094, "r_y0": 713.066, "r_x1": 286.365, "r_y1": 713.066, "r_x2": 286.365, "r_y2": 704.514, "r_x3": 228.094, "r_y3": 704.514, "coord_origin": "TOPLEFT"}, "text": "3, we evaluate", "orig": "3, we evaluate", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Cell Detection. Like any object detector, our Cell BBox Detector provides bounding boxes that can be improved with post-processing during inference. We make use of the grid-like structure of tables to refine the predictions. A detailed explanation on the post-processing is available in the supplementary material. As shown in Tab. 3, we evaluate"}, {"label": "text", "id": 7, "page_no": 6, "cluster": {"id": 7, "label": "text", "bbox": {"l": 308.862, "t": 75.298, "r": 545.115, "b": 227.49099999999999, "coord_origin": "TOPLEFT"}, "confidence": 0.9713197946548462, "cells": [{"index": 144, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 84.029, "r_x1": 322.142, "r_y1": 84.029, "r_x2": 322.142, "r_y2": 75.47699999999998, "r_x3": 308.862, "r_y3": 75.47699999999998, "coord_origin": "TOPLEFT"}, "text": "our", "orig": "our", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 145, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 325.454, "r_y0": 83.88599999999997, "r_x1": 404.567, "r_y1": 83.88599999999997, "r_x2": 404.567, "r_y2": 75.298, "r_x3": 325.454, "r_y3": 75.298, "coord_origin": "TOPLEFT"}, "text": "Cell BBox Decoder", "orig": "Cell BBox Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 146, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 408.104, "r_y0": 84.029, "r_x1": 545.11, "r_y1": 84.029, "r_x2": 545.11, "r_y2": 75.47699999999998, "r_x3": 408.104, "r_y3": 75.47699999999998, "coord_origin": "TOPLEFT"}, "text": "accuracy for cells with a class la-", "orig": "accuracy for cells with a class la-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 147, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 95.98400000000004, "r_x1": 545.115, "r_y1": 95.98400000000004, "r_x2": 545.115, "r_y2": 87.43200000000002, "r_x3": 308.862, "r_y3": 87.43200000000002, "coord_origin": "TOPLEFT"}, "text": "bel of 'content' only using the PASCAL VOC mAP metric", "orig": "bel of 'content' only using the PASCAL VOC mAP metric", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 148, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 107.93899999999996, "r_x1": 320.478, "r_y1": 107.93899999999996, "r_x2": 320.478, "r_y2": 99.38699999999994, "r_x3": 308.862, "r_y3": 99.38699999999994, "coord_origin": "TOPLEFT"}, "text": "for", "orig": "for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 149, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 324.374, "r_y0": 107.93899999999996, "r_x1": 470.226, "r_y1": 107.93899999999996, "r_x2": 470.226, "r_y2": 99.38699999999994, "r_x3": 324.374, "r_y3": 99.38699999999994, "coord_origin": "TOPLEFT"}, "text": "pre-processing and post-processing.", "orig": "pre-processing and post-processing.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 150, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 477.529, "r_y0": 107.93899999999996, "r_x1": 545.115, "r_y1": 107.93899999999996, "r_x2": 545.115, "r_y2": 99.38699999999994, "r_x3": 477.529, "r_y3": 99.38699999999994, "coord_origin": "TOPLEFT"}, "text": "Note that we do", "orig": "Note that we do", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 151, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 119.894, "r_x1": 545.115, "r_y1": 119.894, "r_x2": 545.115, "r_y2": 111.34199999999998, "r_x3": 308.862, "r_y3": 111.34199999999998, "coord_origin": "TOPLEFT"}, "text": "not have post-processing results for SynthTabNet as images", "orig": "not have post-processing results for SynthTabNet as images", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 152, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 131.84900000000005, "r_x1": 545.115, "r_y1": 131.84900000000005, "r_x2": 545.115, "r_y2": 123.29700000000003, "r_x3": 308.862, "r_y3": 123.29700000000003, "coord_origin": "TOPLEFT"}, "text": "are only provided. To compare the performance of our pro-", "orig": "are only provided. To compare the performance of our pro-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 153, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 143.80499999999995, "r_x1": 502.017, "r_y1": 143.80499999999995, "r_x2": 502.017, "r_y2": 135.25300000000004, "r_x3": 308.862, "r_y3": 135.25300000000004, "coord_origin": "TOPLEFT"}, "text": "posed approach, we've integrated TableFormer's", "orig": "posed approach, we've integrated TableFormer's", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 154, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 504.473, "r_y0": 143.66200000000003, "r_x1": 545.11, "r_y1": 143.66200000000003, "r_x2": 545.11, "r_y2": 135.07399999999996, "r_x3": 504.473, "r_y3": 135.07399999999996, "coord_origin": "TOPLEFT"}, "text": "Cell BBox", "orig": "Cell BBox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 155, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 155.61699999999996, "r_x1": 343.163, "r_y1": 155.61699999999996, "r_x2": 343.163, "r_y2": 147.029, "r_x3": 308.862, "r_y3": 147.029, "coord_origin": "TOPLEFT"}, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 156, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 346.371, "r_y0": 155.76, "r_x1": 437.818, "r_y1": 155.76, "r_x2": 437.818, "r_y2": 147.20799999999997, "r_x3": 346.371, "r_y3": 147.20799999999997, "coord_origin": "TOPLEFT"}, "text": "into EDD architecture.", "orig": "into EDD architecture.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 157, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 442.371, "r_y0": 155.76, "r_x1": 545.115, "r_y1": 155.76, "r_x2": 545.115, "r_y2": 147.20799999999997, "r_x3": 442.371, "r_y3": 147.20799999999997, "coord_origin": "TOPLEFT"}, "text": "As mentioned previously,", "orig": "As mentioned previously,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 158, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 167.71500000000003, "r_x1": 446.157, "r_y1": 167.71500000000003, "r_x2": 446.157, "r_y2": 159.163, "r_x3": 308.862, "r_y3": 159.163, "coord_origin": "TOPLEFT"}, "text": "the Structure Decoder provides the", "orig": "the Structure Decoder provides the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 159, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 448.29, "r_y0": 167.572, "r_x1": 525.042, "r_y1": 167.572, "r_x2": 525.042, "r_y2": 158.98400000000004, "r_x3": 448.29, "r_y3": 158.98400000000004, "coord_origin": "TOPLEFT"}, "text": "Cell BBox Decoder", "orig": "Cell BBox Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 160, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 527.399, "r_y0": 167.71500000000003, "r_x1": 545.113, "r_y1": 167.71500000000003, "r_x2": 545.113, "r_y2": 159.163, "r_x3": 527.399, "r_y3": 159.163, "coord_origin": "TOPLEFT"}, "text": "with", "orig": "with", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 161, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 179.66999999999996, "r_x1": 545.115, "r_y1": 179.66999999999996, "r_x2": 545.115, "r_y2": 171.11800000000005, "r_x3": 308.862, "r_y3": 171.11800000000005, "coord_origin": "TOPLEFT"}, "text": "the features needed to predict the bounding box predictions.", "orig": "the features needed to predict the bounding box predictions.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 162, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 191.625, "r_x1": 432.866, "r_y1": 191.625, "r_x2": 432.866, "r_y2": 183.07299999999998, "r_x3": 308.862, "r_y3": 183.07299999999998, "coord_origin": "TOPLEFT"}, "text": "Therefore, the accuracy of the", "orig": "Therefore, the accuracy of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 163, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 436.39, "r_y0": 191.48199999999997, "r_x1": 510.93, "r_y1": 191.48199999999997, "r_x2": 510.93, "r_y2": 182.894, "r_x3": 436.39, "r_y3": 182.894, "coord_origin": "TOPLEFT"}, "text": "Structure Decoder", "orig": "Structure Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 164, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 514.677, "r_y0": 191.625, "r_x1": 545.113, "r_y1": 191.625, "r_x2": 545.113, "r_y2": 183.07299999999998, "r_x3": 514.677, "r_y3": 183.07299999999998, "coord_origin": "TOPLEFT"}, "text": "directly", "orig": "directly", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 165, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 203.58000000000004, "r_x1": 431.173, "r_y1": 203.58000000000004, "r_x2": 431.173, "r_y2": 195.02800000000002, "r_x3": 308.862, "r_y3": 195.02800000000002, "coord_origin": "TOPLEFT"}, "text": "influences the accuracy of the", "orig": "influences the accuracy of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 166, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 434.679, "r_y0": 203.437, "r_x1": 514.181, "r_y1": 203.437, "r_x2": 514.181, "r_y2": 194.84900000000005, "r_x3": 434.679, "r_y3": 194.84900000000005, "coord_origin": "TOPLEFT"}, "text": "Cell BBox Decoder", "orig": "Cell BBox Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 167, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 514.176, "r_y0": 203.58000000000004, "r_x1": 516.667, "r_y1": 203.58000000000004, "r_x2": 516.667, "r_y2": 195.02800000000002, "r_x3": 514.176, "r_y3": 195.02800000000002, "coord_origin": "TOPLEFT"}, "text": ".", "orig": ".", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 168, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 522.794, "r_y0": 203.58000000000004, "r_x1": 529.429, "r_y1": 203.58000000000004, "r_x2": 529.429, "r_y2": 195.02800000000002, "r_x3": 522.794, "r_y3": 195.02800000000002, "coord_origin": "TOPLEFT"}, "text": "If", "orig": "If", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 169, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 532.936, "r_y0": 203.58000000000004, "r_x1": 545.11, "r_y1": 203.58000000000004, "r_x2": 545.11, "r_y2": 195.02800000000002, "r_x3": 532.936, "r_y3": 195.02800000000002, "coord_origin": "TOPLEFT"}, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 170, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 215.39300000000003, "r_x1": 382.356, "r_y1": 215.39300000000003, "r_x2": 382.356, "r_y2": 206.80499999999995, "r_x3": 308.862, "r_y3": 206.80499999999995, "coord_origin": "TOPLEFT"}, "text": "Structure Decoder", "orig": "Structure Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 171, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 385.075, "r_y0": 215.53599999999994, "r_x1": 545.114, "r_y1": 215.53599999999994, "r_x2": 545.114, "r_y2": 206.98400000000004, "r_x3": 385.075, "r_y3": 206.98400000000004, "coord_origin": "TOPLEFT"}, "text": "predicts an extra column, this will result", "orig": "predicts an extra column, this will result", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 172, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 227.49099999999999, "r_x1": 501.698, "r_y1": 227.49099999999999, "r_x2": 501.698, "r_y2": 218.93899999999996, "r_x3": 308.862, "r_y3": 218.93899999999996, "coord_origin": "TOPLEFT"}, "text": "in an extra column of predicted bounding boxes.", "orig": "in an extra column of predicted bounding boxes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "our Cell BBox Decoder accuracy for cells with a class label of 'content' only using the PASCAL VOC mAP metric for pre-processing and post-processing. Note that we do not have post-processing results for SynthTabNet as images are only provided. To compare the performance of our proposed approach, we've integrated TableFormer's Cell BBox Decoder into EDD architecture. As mentioned previously, the Structure Decoder provides the Cell BBox Decoder with the features needed to predict the bounding box predictions. Therefore, the accuracy of the Structure Decoder directly influences the accuracy of the Cell BBox Decoder . If the Structure Decoder predicts an extra column, this will result in an extra column of predicted bounding boxes."}, {"label": "table", "id": 8, "page_no": 6, "cluster": {"id": 8, "label": "table", "bbox": {"l": 308.4068603515625, "t": 247.87631225585938, "r": 533.6419677734375, "b": 303.8056640625, "coord_origin": "TOPLEFT"}, "confidence": 0.9691730737686157, "cells": [{"index": 173, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 339.323, "r_y0": 262.485, "r_x1": 365.335, "r_y1": 262.485, "r_x2": 365.335, "r_y2": 253.933, "r_x3": 339.323, "r_y3": 253.933, "coord_origin": "TOPLEFT"}, "text": "Model", "orig": "Model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 174, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 401.041, "r_y0": 262.485, "r_x1": 430.919, "r_y1": 262.485, "r_x2": 430.919, "r_y2": 253.933, "r_x3": 401.041, "r_y3": 253.933, "coord_origin": "TOPLEFT"}, "text": "Dataset", "orig": "Dataset", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 175, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 454.102, "r_y0": 262.485, "r_x1": 474.585, "r_y1": 262.485, "r_x2": 474.585, "r_y2": 253.933, "r_x3": 454.102, "r_y3": 253.933, "coord_origin": "TOPLEFT"}, "text": "mAP", "orig": "mAP", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 176, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 486.54, "r_y0": 262.485, "r_x1": 527.228, "r_y1": 262.485, "r_x2": 527.228, "r_y2": 253.933, "r_x3": 486.54, "r_y3": 253.933, "coord_origin": "TOPLEFT"}, "text": "mAP (PP)", "orig": "mAP (PP)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 177, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 327.656, "r_y0": 279.442, "r_x1": 377.001, "r_y1": 279.442, "r_x2": 377.001, "r_y2": 270.89, "r_x3": 327.656, "r_y3": 270.89, "coord_origin": "TOPLEFT"}, "text": "EDD+BBox", "orig": "EDD+BBox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 178, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 393.698, "r_y0": 279.442, "r_x1": 438.281, "r_y1": 279.442, "r_x2": 438.281, "r_y2": 270.89, "r_x3": 393.698, "r_y3": 270.89, "coord_origin": "TOPLEFT"}, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 179, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 455.636, "r_y0": 279.442, "r_x1": 473.07, "r_y1": 279.442, "r_x2": 473.07, "r_y2": 270.89, "r_x3": 455.636, "r_y3": 270.89, "coord_origin": "TOPLEFT"}, "text": "79.2", "orig": "79.2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 180, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 498.166, "r_y0": 279.442, "r_x1": 515.6, "r_y1": 279.442, "r_x2": 515.6, "r_y2": 270.89, "r_x3": 498.166, "r_y3": 270.89, "coord_origin": "TOPLEFT"}, "text": "82.7", "orig": "82.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 181, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 326.795, "r_y0": 291.397, "r_x1": 377.863, "r_y1": 291.397, "r_x2": 377.863, "r_y2": 282.845, "r_x3": 326.795, "r_y3": 282.845, "coord_origin": "TOPLEFT"}, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 182, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 393.694, "r_y0": 291.397, "r_x1": 438.276, "r_y1": 291.397, "r_x2": 438.276, "r_y2": 282.845, "r_x3": 393.694, "r_y3": 282.845, "coord_origin": "TOPLEFT"}, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 183, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 455.631, "r_y0": 291.413, "r_x1": 473.066, "r_y1": 291.413, "r_x2": 473.066, "r_y2": 282.457, "r_x3": 455.631, "r_y3": 282.457, "coord_origin": "TOPLEFT"}, "text": "82.1", "orig": "82.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 184, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 498.171, "r_y0": 291.413, "r_x1": 515.606, "r_y1": 291.413, "r_x2": 515.606, "r_y2": 282.457, "r_x3": 498.171, "r_y3": 282.457, "coord_origin": "TOPLEFT"}, "text": "86.8", "orig": "86.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 185, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 326.795, "r_y0": 303.352, "r_x1": 377.863, "r_y1": 303.352, "r_x2": 377.863, "r_y2": 294.8, "r_x3": 326.795, "r_y3": 294.8, "coord_origin": "TOPLEFT"}, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 186, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 389.818, "r_y0": 303.352, "r_x1": 442.152, "r_y1": 303.352, "r_x2": 442.152, "r_y2": 294.8, "r_x3": 389.818, "r_y3": 294.8, "coord_origin": "TOPLEFT"}, "text": "SynthTabNet", "orig": "SynthTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 187, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 455.631, "r_y0": 303.352, "r_x1": 473.066, "r_y1": 303.352, "r_x2": 473.066, "r_y2": 294.8, "r_x3": 455.631, "r_y3": 294.8, "coord_origin": "TOPLEFT"}, "text": "87.7", "orig": "87.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 188, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 505.225, "r_y0": 303.352, "r_x1": 508.543, "r_y1": 303.352, "r_x2": 508.543, "r_y2": 294.8, "r_x3": 505.225, "r_y3": 294.8, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": [{"id": 83, "label": "text", "bbox": {"l": 339.323, "t": 253.933, "r": 365.335, "b": 262.485, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 173, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 339.323, "r_y0": 262.485, "r_x1": 365.335, "r_y1": 262.485, "r_x2": 365.335, "r_y2": 253.933, "r_x3": 339.323, "r_y3": 253.933, "coord_origin": "TOPLEFT"}, "text": "Model", "orig": "Model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 84, "label": "text", "bbox": {"l": 401.041, "t": 253.933, "r": 430.919, "b": 262.485, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 174, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 401.041, "r_y0": 262.485, "r_x1": 430.919, "r_y1": 262.485, "r_x2": 430.919, "r_y2": 253.933, "r_x3": 401.041, "r_y3": 253.933, "coord_origin": "TOPLEFT"}, "text": "Dataset", "orig": "Dataset", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 85, "label": "text", "bbox": {"l": 454.102, "t": 253.933, "r": 474.585, "b": 262.485, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 175, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 454.102, "r_y0": 262.485, "r_x1": 474.585, "r_y1": 262.485, "r_x2": 474.585, "r_y2": 253.933, "r_x3": 454.102, "r_y3": 253.933, "coord_origin": "TOPLEFT"}, "text": "mAP", "orig": "mAP", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 86, "label": "text", "bbox": {"l": 486.54, "t": 253.933, "r": 527.228, "b": 262.485, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 176, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 486.54, "r_y0": 262.485, "r_x1": 527.228, "r_y1": 262.485, "r_x2": 527.228, "r_y2": 253.933, "r_x3": 486.54, "r_y3": 253.933, "coord_origin": "TOPLEFT"}, "text": "mAP (PP)", "orig": "mAP (PP)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 87, "label": "text", "bbox": {"l": 327.656, "t": 270.89, "r": 377.001, "b": 279.442, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 177, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 327.656, "r_y0": 279.442, "r_x1": 377.001, "r_y1": 279.442, "r_x2": 377.001, "r_y2": 270.89, "r_x3": 327.656, "r_y3": 270.89, "coord_origin": "TOPLEFT"}, "text": "EDD+BBox", "orig": "EDD+BBox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 88, "label": "text", "bbox": {"l": 393.698, "t": 270.89, "r": 438.281, "b": 279.442, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 178, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 393.698, "r_y0": 279.442, "r_x1": 438.281, "r_y1": 279.442, "r_x2": 438.281, "r_y2": 270.89, "r_x3": 393.698, "r_y3": 270.89, "coord_origin": "TOPLEFT"}, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 89, "label": "text", "bbox": {"l": 455.636, "t": 270.89, "r": 473.07, "b": 279.442, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 179, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 455.636, "r_y0": 279.442, "r_x1": 473.07, "r_y1": 279.442, "r_x2": 473.07, "r_y2": 270.89, "r_x3": 455.636, "r_y3": 270.89, "coord_origin": "TOPLEFT"}, "text": "79.2", "orig": "79.2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 90, "label": "text", "bbox": {"l": 498.166, "t": 270.89, "r": 515.6, "b": 279.442, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 180, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 498.166, "r_y0": 279.442, "r_x1": 515.6, "r_y1": 279.442, "r_x2": 515.6, "r_y2": 270.89, "r_x3": 498.166, "r_y3": 270.89, "coord_origin": "TOPLEFT"}, "text": "82.7", "orig": "82.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 91, "label": "text", "bbox": {"l": 326.795, "t": 282.845, "r": 377.863, "b": 291.397, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 181, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 326.795, "r_y0": 291.397, "r_x1": 377.863, "r_y1": 291.397, "r_x2": 377.863, "r_y2": 282.845, "r_x3": 326.795, "r_y3": 282.845, "coord_origin": "TOPLEFT"}, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 92, "label": "text", "bbox": {"l": 393.694, "t": 282.845, "r": 438.276, "b": 291.397, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 182, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 393.694, "r_y0": 291.397, "r_x1": 438.276, "r_y1": 291.397, "r_x2": 438.276, "r_y2": 282.845, "r_x3": 393.694, "r_y3": 282.845, "coord_origin": "TOPLEFT"}, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 93, "label": "text", "bbox": {"l": 455.631, "t": 282.457, "r": 473.066, "b": 291.413, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 183, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 455.631, "r_y0": 291.413, "r_x1": 473.066, "r_y1": 291.413, "r_x2": 473.066, "r_y2": 282.457, "r_x3": 455.631, "r_y3": 282.457, "coord_origin": "TOPLEFT"}, "text": "82.1", "orig": "82.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 94, "label": "text", "bbox": {"l": 498.171, "t": 282.457, "r": 515.606, "b": 291.413, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 184, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 498.171, "r_y0": 291.413, "r_x1": 515.606, "r_y1": 291.413, "r_x2": 515.606, "r_y2": 282.457, "r_x3": 498.171, "r_y3": 282.457, "coord_origin": "TOPLEFT"}, "text": "86.8", "orig": "86.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 95, "label": "text", "bbox": {"l": 326.795, "t": 294.8, "r": 377.863, "b": 303.352, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 185, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 326.795, "r_y0": 303.352, "r_x1": 377.863, "r_y1": 303.352, "r_x2": 377.863, "r_y2": 294.8, "r_x3": 326.795, "r_y3": 294.8, "coord_origin": "TOPLEFT"}, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 96, "label": "text", "bbox": {"l": 389.818, "t": 294.8, "r": 442.152, "b": 303.352, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 186, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 389.818, "r_y0": 303.352, "r_x1": 442.152, "r_y1": 303.352, "r_x2": 442.152, "r_y2": 294.8, "r_x3": 389.818, "r_y3": 294.8, "coord_origin": "TOPLEFT"}, "text": "SynthTabNet", "orig": "SynthTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 97, "label": "text", "bbox": {"l": 455.631, "t": 294.8, "r": 473.066, "b": 303.352, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 187, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 455.631, "r_y0": 303.352, "r_x1": 473.066, "r_y1": 303.352, "r_x2": 473.066, "r_y2": 294.8, "r_x3": 455.631, "r_y3": 294.8, "coord_origin": "TOPLEFT"}, "text": "87.7", "orig": "87.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 98, "label": "text", "bbox": {"l": 505.225, "t": 294.8, "r": 508.543, "b": 303.352, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 188, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 505.225, "r_y0": 303.352, "r_x1": 508.543, "r_y1": 303.352, "r_x2": 508.543, "r_y2": 294.8, "r_x3": 505.225, "r_y3": 294.8, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}]}, "text": null, "otsl_seq": ["ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl"], "num_rows": 4, "num_cols": 4, "table_cells": [{"bbox": {"l": 339.323, "t": 253.933, "r": 365.335, "b": 262.485, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Model", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 401.041, "t": 253.933, "r": 430.919, "b": 262.485, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "Dataset", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 454.102, "t": 253.933, "r": 474.585, "b": 262.485, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "mAP", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 486.54, "t": 253.933, "r": 527.228, "b": 262.485, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "mAP (PP)", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 327.656, "t": 270.89, "r": 377.001, "b": 279.442, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "EDD+BBox", "column_header": false, "row_header": true, "row_section": false}, {"bbox": {"l": 393.698, "t": 270.89, "r": 438.281, "b": 279.442, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "PubTabNet", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 455.636, "t": 270.89, "r": 473.07, "b": 279.442, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "79.2", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 498.166, "t": 270.89, "r": 515.6, "b": 279.442, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "82.7", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 326.795, "t": 282.845, "r": 377.863, "b": 291.397, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "TableFormer", "column_header": false, "row_header": true, "row_section": false}, {"bbox": {"l": 393.694, "t": 282.845, "r": 438.276, "b": 291.397, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "PubTabNet", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 455.631, "t": 282.457, "r": 473.066, "b": 291.413, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "82.1", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 498.171, "t": 282.457, "r": 515.606, "b": 291.413, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "86.8", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 326.795, "t": 294.8, "r": 377.863, "b": 303.352, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "TableFormer", "column_header": false, "row_header": true, "row_section": false}, {"bbox": {"l": 389.818, "t": 294.8, "r": 442.152, "b": 303.352, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "SynthTabNet", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 455.631, "t": 294.8, "r": 473.066, "b": 303.352, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "87.7", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 505.225, "t": 294.8, "r": 508.543, "b": 303.352, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "-", "column_header": false, "row_header": false, "row_section": false}]}, {"label": "caption", "id": 12, "page_no": 6, "cluster": {"id": 12, "label": "caption", "bbox": {"l": 308.862, "t": 316.718, "r": 545.115, "b": 337.225, "coord_origin": "TOPLEFT"}, "confidence": 0.9519917964935303, "cells": [{"index": 189, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 325.27, "r_x1": 341.499, "r_y1": 325.27, "r_x2": 341.499, "r_y2": 316.718, "r_x3": 308.862, "r_y3": 316.718, "coord_origin": "TOPLEFT"}, "text": "Table 3:", "orig": "Table 3:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 190, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 348.603, "r_y0": 325.27, "r_x1": 545.115, "r_y1": 325.27, "r_x2": 545.115, "r_y2": 316.718, "r_x3": 348.603, "r_y3": 316.718, "coord_origin": "TOPLEFT"}, "text": "Cell Bounding Box detection results on PubTab-", "orig": "Cell Bounding Box detection results on PubTab-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 191, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 337.225, "r_x1": 474.978, "r_y1": 337.225, "r_x2": 474.978, "r_y2": 328.673, "r_x3": 308.862, "r_y3": 328.673, "coord_origin": "TOPLEFT"}, "text": "Net, and FinTabNet. PP: Post-processing.", "orig": "Net, and FinTabNet. PP: Post-processing.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Table 3: Cell Bounding Box detection results on PubTabNet, and FinTabNet. PP: Post-processing."}, {"label": "text", "id": 4, "page_no": 6, "cluster": {"id": 4, "label": "text", "bbox": {"l": 308.862, "t": 367.68, "r": 545.116, "b": 520.082, "coord_origin": "TOPLEFT"}, "confidence": 0.9835010766983032, "cells": [{"index": 192, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 376.636, "r_x1": 378.949, "r_y1": 376.636, "r_x2": 378.949, "r_y2": 367.68, "r_x3": 320.817, "r_y3": 367.68, "coord_origin": "TOPLEFT"}, "text": "Cell Content.", "orig": "Cell Content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 193, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 387.079, "r_y0": 376.62, "r_x1": 395.378, "r_y1": 376.62, "r_x2": 395.378, "r_y2": 368.068, "r_x3": 387.079, "r_y3": 368.068, "coord_origin": "TOPLEFT"}, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 194, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 399.552, "r_y0": 376.62, "r_x1": 413.948, "r_y1": 376.62, "r_x2": 413.948, "r_y2": 368.068, "r_x3": 399.552, "r_y3": 368.068, "coord_origin": "TOPLEFT"}, "text": "this", "orig": "this", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 195, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 418.112, "r_y0": 376.62, "r_x1": 448.827, "r_y1": 376.62, "r_x2": 448.827, "r_y2": 368.068, "r_x3": 418.112, "r_y3": 368.068, "coord_origin": "TOPLEFT"}, "text": "section,", "orig": "section,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 196, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 453.42, "r_y0": 376.62, "r_x1": 545.116, "r_y1": 376.62, "r_x2": 545.116, "r_y2": 368.068, "r_x3": 453.42, "r_y3": 368.068, "coord_origin": "TOPLEFT"}, "text": "we evaluate the entire", "orig": "we evaluate the entire", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 197, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 388.575, "r_x1": 487.193, "r_y1": 388.575, "r_x2": 487.193, "r_y2": 380.023, "r_x3": 308.862, "r_y3": 380.023, "coord_origin": "TOPLEFT"}, "text": "pipeline of recovering a table with content.", "orig": "pipeline of recovering a table with content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 198, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 493.967, "r_y0": 388.575, "r_x1": 545.115, "r_y1": 388.575, "r_x2": 545.115, "r_y2": 380.023, "r_x3": 493.967, "r_y3": 380.023, "coord_origin": "TOPLEFT"}, "text": "Here we put", "orig": "Here we put", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 199, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 400.53, "r_x1": 545.115, "r_y1": 400.53, "r_x2": 545.115, "r_y2": 391.978, "r_x3": 308.862, "r_y3": 391.978, "coord_origin": "TOPLEFT"}, "text": "our approach to test by capitalizing on extracting content", "orig": "our approach to test by capitalizing on extracting content", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 200, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 412.486, "r_x1": 545.115, "r_y1": 412.486, "r_x2": 545.115, "r_y2": 403.934, "r_x3": 308.862, "r_y3": 403.934, "coord_origin": "TOPLEFT"}, "text": "from the PDF cells rather than decoding from images. Tab.", "orig": "from the PDF cells rather than decoding from images. Tab.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 201, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 424.441, "r_x1": 545.115, "r_y1": 424.441, "r_x2": 545.115, "r_y2": 415.889, "r_x3": 308.862, "r_y3": 415.889, "coord_origin": "TOPLEFT"}, "text": "4 shows the TEDs score of HTML code representing the", "orig": "4 shows the TEDs score of HTML code representing the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 202, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 436.396, "r_x1": 545.115, "r_y1": 436.396, "r_x2": 545.115, "r_y2": 427.844, "r_x3": 308.862, "r_y3": 427.844, "coord_origin": "TOPLEFT"}, "text": "structure of the table along with the content inserted in the", "orig": "structure of the table along with the content inserted in the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 203, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 448.351, "r_x1": 545.115, "r_y1": 448.351, "r_x2": 545.115, "r_y2": 439.799, "r_x3": 308.862, "r_y3": 439.799, "coord_origin": "TOPLEFT"}, "text": "data cell and compared with the ground-truth. Our method", "orig": "data cell and compared with the ground-truth. Our method", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 204, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 460.306, "r_x1": 350.237, "r_y1": 460.306, "r_x2": 350.237, "r_y2": 451.754, "r_x3": 308.862, "r_y3": 451.754, "coord_origin": "TOPLEFT"}, "text": "achieved a", "orig": "achieved a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 205, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 352.176, "r_y0": 460.322, "r_x1": 374.592, "r_y1": 460.322, "r_x2": 374.592, "r_y2": 451.366, "r_x3": 352.176, "r_y3": 451.366, "coord_origin": "TOPLEFT"}, "text": "5.3%", "orig": "5.3%", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 206, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 376.533, "r_y0": 460.306, "r_x1": 545.11, "r_y1": 460.306, "r_x2": 545.11, "r_y2": 451.754, "r_x3": 376.533, "r_y3": 451.754, "coord_origin": "TOPLEFT"}, "text": "increase over the state-of-the-art, and com-", "orig": "increase over the state-of-the-art, and com-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 207, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 472.261, "r_x1": 380.523, "r_y1": 472.261, "r_x2": 380.523, "r_y2": 463.709, "r_x3": 308.862, "r_y3": 463.709, "coord_origin": "TOPLEFT"}, "text": "mercial solutions.", "orig": "mercial solutions.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 208, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 386.042, "r_y0": 472.261, "r_x1": 545.115, "r_y1": 472.261, "r_x2": 545.115, "r_y2": 463.709, "r_x3": 386.042, "r_y3": 463.709, "coord_origin": "TOPLEFT"}, "text": "We believe our scores would be higher", "orig": "We believe our scores would be higher", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 209, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 484.217, "r_x1": 314.949, "r_y1": 484.217, "r_x2": 314.949, "r_y2": 475.665, "r_x3": 308.862, "r_y3": 475.665, "coord_origin": "TOPLEFT"}, "text": "if", "orig": "if", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 210, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 318.008, "r_y0": 484.217, "r_x1": 545.115, "r_y1": 484.217, "r_x2": 545.115, "r_y2": 475.665, "r_x3": 318.008, "r_y3": 475.665, "coord_origin": "TOPLEFT"}, "text": "the HTML ground-truth matched the extracted PDF cell", "orig": "the HTML ground-truth matched the extracted PDF cell", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 211, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 496.172, "r_x1": 340.683, "r_y1": 496.172, "r_x2": 340.683, "r_y2": 487.62, "r_x3": 308.862, "r_y3": 487.62, "coord_origin": "TOPLEFT"}, "text": "content.", "orig": "content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 212, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 345.793, "r_y0": 496.172, "r_x1": 545.115, "r_y1": 496.172, "r_x2": 545.115, "r_y2": 487.62, "r_x3": 345.793, "r_y3": 487.62, "coord_origin": "TOPLEFT"}, "text": "Unfortunately, there are small discrepancies such", "orig": "Unfortunately, there are small discrepancies such", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 213, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 508.127, "r_x1": 545.115, "r_y1": 508.127, "r_x2": 545.115, "r_y2": 499.575, "r_x3": 308.862, "r_y3": 499.575, "coord_origin": "TOPLEFT"}, "text": "as spacings around words or special characters with various", "orig": "as spacings around words or special characters with various", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 214, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 520.082, "r_x1": 405.698, "r_y1": 520.082, "r_x2": 405.698, "r_y2": 511.53, "r_x3": 308.862, "r_y3": 511.53, "coord_origin": "TOPLEFT"}, "text": "unicode representations.", "orig": "unicode representations.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Cell Content. In this section, we evaluate the entire pipeline of recovering a table with content. Here we put our approach to test by capitalizing on extracting content from the PDF cells rather than decoding from images. Tab. 4 shows the TEDs score of HTML code representing the structure of the table along with the content inserted in the data cell and compared with the ground-truth. Our method achieved a 5.3% increase over the state-of-the-art, and commercial solutions. We believe our scores would be higher if the HTML ground-truth matched the extracted PDF cell content. Unfortunately, there are small discrepancies such as spacings around words or special characters with various unicode representations."}, {"label": "table", "id": 5, "page_no": 6, "cluster": {"id": 5, "label": "table", "bbox": {"l": 332.9688720703125, "t": 540.2835693359375, "r": 520.942138671875, "b": 643.2697143554688, "coord_origin": "TOPLEFT"}, "confidence": 0.9775567650794983, "cells": [{"index": 215, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 358.011, "r_y0": 561.054, "r_x1": 384.023, "r_y1": 561.054, "r_x2": 384.023, "r_y2": 552.502, "r_x3": 358.011, "r_y3": 552.502, "coord_origin": "TOPLEFT"}, "text": "Model", "orig": "Model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 216, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 449.034, "r_y0": 555.076, "r_x1": 473.94, "r_y1": 555.076, "r_x2": 473.94, "r_y2": 546.524, "r_x3": 449.034, "r_y3": 546.524, "coord_origin": "TOPLEFT"}, "text": "TEDS", "orig": "TEDS", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 217, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 408.506, "r_y0": 567.031, "r_x1": 436.74, "r_y1": 567.031, "r_x2": 436.74, "r_y2": 558.479, "r_x3": 408.506, "r_y3": 558.479, "coord_origin": "TOPLEFT"}, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 218, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 448.695, "r_y0": 567.031, "r_x1": 485.079, "r_y1": 567.031, "r_x2": 485.079, "r_y2": 558.479, "r_x3": 448.695, "r_y3": 558.479, "coord_origin": "TOPLEFT"}, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 219, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 499.385, "r_y0": 567.031, "r_x1": 512.117, "r_y1": 567.031, "r_x2": 512.117, "r_y2": 558.479, "r_x3": 499.385, "r_y3": 558.479, "coord_origin": "TOPLEFT"}, "text": "All", "orig": "All", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 220, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 357.682, "r_y0": 583.988, "r_x1": 384.352, "r_y1": 583.988, "r_x2": 384.352, "r_y2": 575.436, "r_x3": 357.682, "r_y3": 575.436, "coord_origin": "TOPLEFT"}, "text": "Tabula", "orig": "Tabula", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 221, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 413.901, "r_y0": 583.988, "r_x1": 431.336, "r_y1": 583.988, "r_x2": 431.336, "r_y2": 575.436, "r_x3": 413.901, "r_y3": 575.436, "coord_origin": "TOPLEFT"}, "text": "78.0", "orig": "78.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 222, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 458.165, "r_y0": 583.988, "r_x1": 475.599, "r_y1": 583.988, "r_x2": 475.599, "r_y2": 575.436, "r_x3": 458.165, "r_y3": 575.436, "coord_origin": "TOPLEFT"}, "text": "57.8", "orig": "57.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 223, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 497.029, "r_y0": 583.988, "r_x1": 514.463, "r_y1": 583.988, "r_x2": 514.463, "r_y2": 575.436, "r_x3": 497.029, "r_y3": 575.436, "coord_origin": "TOPLEFT"}, "text": "67.9", "orig": "67.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 224, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 350.723, "r_y0": 595.943, "r_x1": 391.311, "r_y1": 595.943, "r_x2": 391.311, "r_y2": 587.391, "r_x3": 350.723, "r_y3": 587.391, "coord_origin": "TOPLEFT"}, "text": "Traprange", "orig": "Traprange", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 225, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 413.906, "r_y0": 595.943, "r_x1": 431.34, "r_y1": 595.943, "r_x2": 431.34, "r_y2": 587.391, "r_x3": 413.906, "r_y3": 587.391, "coord_origin": "TOPLEFT"}, "text": "60.8", "orig": "60.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 226, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 458.17, "r_y0": 595.943, "r_x1": 475.604, "r_y1": 595.943, "r_x2": 475.604, "r_y2": 587.391, "r_x3": 458.17, "r_y3": 587.391, "coord_origin": "TOPLEFT"}, "text": "49.9", "orig": "49.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 227, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 497.034, "r_y0": 595.943, "r_x1": 514.468, "r_y1": 595.943, "r_x2": 514.468, "r_y2": 587.391, "r_x3": 497.034, "r_y3": 587.391, "coord_origin": "TOPLEFT"}, "text": "55.4", "orig": "55.4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 228, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 354.136, "r_y0": 607.899, "r_x1": 387.899, "r_y1": 607.899, "r_x2": 387.899, "r_y2": 599.347, "r_x3": 354.136, "r_y3": 599.347, "coord_origin": "TOPLEFT"}, "text": "Camelot", "orig": "Camelot", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 229, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 413.902, "r_y0": 607.899, "r_x1": 431.336, "r_y1": 607.899, "r_x2": 431.336, "r_y2": 599.347, "r_x3": 413.902, "r_y3": 599.347, "coord_origin": "TOPLEFT"}, "text": "80.0", "orig": "80.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 230, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 458.165, "r_y0": 607.899, "r_x1": 475.6, "r_y1": 607.899, "r_x2": 475.6, "r_y2": 599.347, "r_x3": 458.165, "r_y3": 599.347, "coord_origin": "TOPLEFT"}, "text": "66.0", "orig": "66.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 231, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 497.03, "r_y0": 607.899, "r_x1": 514.464, "r_y1": 607.899, "r_x2": 514.464, "r_y2": 599.347, "r_x3": 497.03, "r_y3": 599.347, "coord_origin": "TOPLEFT"}, "text": "73.0", "orig": "73.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 232, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 346.559, "r_y0": 619.854, "r_x1": 395.475, "r_y1": 619.854, "r_x2": 395.475, "r_y2": 611.302, "r_x3": 346.559, "r_y3": 611.302, "coord_origin": "TOPLEFT"}, "text": "Acrobat Pro", "orig": "Acrobat Pro", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 233, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 413.906, "r_y0": 619.854, "r_x1": 431.341, "r_y1": 619.854, "r_x2": 431.341, "r_y2": 611.302, "r_x3": 413.906, "r_y3": 611.302, "coord_origin": "TOPLEFT"}, "text": "68.9", "orig": "68.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 234, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 458.17, "r_y0": 619.854, "r_x1": 475.605, "r_y1": 619.854, "r_x2": 475.605, "r_y2": 611.302, "r_x3": 458.17, "r_y3": 611.302, "coord_origin": "TOPLEFT"}, "text": "61.8", "orig": "61.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 235, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 497.034, "r_y0": 619.854, "r_x1": 514.469, "r_y1": 619.854, "r_x2": 514.469, "r_y2": 611.302, "r_x3": 497.034, "r_y3": 611.302, "coord_origin": "TOPLEFT"}, "text": "65.3", "orig": "65.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 236, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 360.781, "r_y0": 631.809, "r_x1": 381.254, "r_y1": 631.809, "r_x2": 381.254, "r_y2": 623.2570000000001, "r_x3": 360.781, "r_y3": 623.2570000000001, "coord_origin": "TOPLEFT"}, "text": "EDD", "orig": "EDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 237, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 413.902, "r_y0": 631.809, "r_x1": 431.336, "r_y1": 631.809, "r_x2": 431.336, "r_y2": 623.2570000000001, "r_x3": 413.902, "r_y3": 623.2570000000001, "coord_origin": "TOPLEFT"}, "text": "91.2", "orig": "91.2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 238, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 458.165, "r_y0": 631.809, "r_x1": 475.6, "r_y1": 631.809, "r_x2": 475.6, "r_y2": 623.2570000000001, "r_x3": 458.165, "r_y3": 623.2570000000001, "coord_origin": "TOPLEFT"}, "text": "85.4", "orig": "85.4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 239, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 497.03, "r_y0": 631.809, "r_x1": 514.464, "r_y1": 631.809, "r_x2": 514.464, "r_y2": 623.2570000000001, "r_x3": 497.03, "r_y3": 623.2570000000001, "coord_origin": "TOPLEFT"}, "text": "88.3", "orig": "88.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 240, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 345.483, "r_y0": 643.764, "r_x1": 396.551, "r_y1": 643.764, "r_x2": 396.551, "r_y2": 635.212, "r_x3": 345.483, "r_y3": 635.212, "coord_origin": "TOPLEFT"}, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 241, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 413.906, "r_y0": 643.764, "r_x1": 431.341, "r_y1": 643.764, "r_x2": 431.341, "r_y2": 635.212, "r_x3": 413.906, "r_y3": 635.212, "coord_origin": "TOPLEFT"}, "text": "95.4", "orig": "95.4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 242, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 458.17, "r_y0": 643.764, "r_x1": 475.605, "r_y1": 643.764, "r_x2": 475.605, "r_y2": 635.212, "r_x3": 458.17, "r_y3": 635.212, "coord_origin": "TOPLEFT"}, "text": "90.1", "orig": "90.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 243, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 497.034, "r_y0": 643.78, "r_x1": 514.469, "r_y1": 643.78, "r_x2": 514.469, "r_y2": 634.8240000000001, "r_x3": 497.034, "r_y3": 634.8240000000001, "coord_origin": "TOPLEFT"}, "text": "93.6", "orig": "93.6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": [{"id": 99, "label": "text", "bbox": {"l": 358.011, "t": 552.502, "r": 384.023, "b": 561.054, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 215, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 358.011, "r_y0": 561.054, "r_x1": 384.023, "r_y1": 561.054, "r_x2": 384.023, "r_y2": 552.502, "r_x3": 358.011, "r_y3": 552.502, "coord_origin": "TOPLEFT"}, "text": "Model", "orig": "Model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 100, "label": "text", "bbox": {"l": 449.034, "t": 546.524, "r": 473.94, "b": 555.076, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 216, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 449.034, "r_y0": 555.076, "r_x1": 473.94, "r_y1": 555.076, "r_x2": 473.94, "r_y2": 546.524, "r_x3": 449.034, "r_y3": 546.524, "coord_origin": "TOPLEFT"}, "text": "TEDS", "orig": "TEDS", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 101, "label": "text", "bbox": {"l": 408.506, "t": 558.479, "r": 436.74, "b": 567.031, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 217, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 408.506, "r_y0": 567.031, "r_x1": 436.74, "r_y1": 567.031, "r_x2": 436.74, "r_y2": 558.479, "r_x3": 408.506, "r_y3": 558.479, "coord_origin": "TOPLEFT"}, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 102, "label": "text", "bbox": {"l": 448.695, "t": 558.479, "r": 485.079, "b": 567.031, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 218, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 448.695, "r_y0": 567.031, "r_x1": 485.079, "r_y1": 567.031, "r_x2": 485.079, "r_y2": 558.479, "r_x3": 448.695, "r_y3": 558.479, "coord_origin": "TOPLEFT"}, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 103, "label": "text", "bbox": {"l": 499.385, "t": 558.479, "r": 512.117, "b": 567.031, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 219, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 499.385, "r_y0": 567.031, "r_x1": 512.117, "r_y1": 567.031, "r_x2": 512.117, "r_y2": 558.479, "r_x3": 499.385, "r_y3": 558.479, "coord_origin": "TOPLEFT"}, "text": "All", "orig": "All", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 104, "label": "text", "bbox": {"l": 357.682, "t": 575.436, "r": 384.352, "b": 583.988, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 220, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 357.682, "r_y0": 583.988, "r_x1": 384.352, "r_y1": 583.988, "r_x2": 384.352, "r_y2": 575.436, "r_x3": 357.682, "r_y3": 575.436, "coord_origin": "TOPLEFT"}, "text": "Tabula", "orig": "Tabula", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 105, "label": "text", "bbox": {"l": 413.901, "t": 575.436, "r": 431.336, "b": 583.988, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 221, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 413.901, "r_y0": 583.988, "r_x1": 431.336, "r_y1": 583.988, "r_x2": 431.336, "r_y2": 575.436, "r_x3": 413.901, "r_y3": 575.436, "coord_origin": "TOPLEFT"}, "text": "78.0", "orig": "78.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 106, "label": "text", "bbox": {"l": 458.165, "t": 575.436, "r": 475.599, "b": 583.988, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 222, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 458.165, "r_y0": 583.988, "r_x1": 475.599, "r_y1": 583.988, "r_x2": 475.599, "r_y2": 575.436, "r_x3": 458.165, "r_y3": 575.436, "coord_origin": "TOPLEFT"}, "text": "57.8", "orig": "57.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 107, "label": "text", "bbox": {"l": 497.029, "t": 575.436, "r": 514.463, "b": 583.988, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 223, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 497.029, "r_y0": 583.988, "r_x1": 514.463, "r_y1": 583.988, "r_x2": 514.463, "r_y2": 575.436, "r_x3": 497.029, "r_y3": 575.436, "coord_origin": "TOPLEFT"}, "text": "67.9", "orig": "67.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 108, "label": "text", "bbox": {"l": 350.723, "t": 587.391, "r": 391.311, "b": 595.943, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 224, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 350.723, "r_y0": 595.943, "r_x1": 391.311, "r_y1": 595.943, "r_x2": 391.311, "r_y2": 587.391, "r_x3": 350.723, "r_y3": 587.391, "coord_origin": "TOPLEFT"}, "text": "Traprange", "orig": "Traprange", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 109, "label": "text", "bbox": {"l": 413.906, "t": 587.391, "r": 431.34, "b": 595.943, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 225, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 413.906, "r_y0": 595.943, "r_x1": 431.34, "r_y1": 595.943, "r_x2": 431.34, "r_y2": 587.391, "r_x3": 413.906, "r_y3": 587.391, "coord_origin": "TOPLEFT"}, "text": "60.8", "orig": "60.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 110, "label": "text", "bbox": {"l": 458.17, "t": 587.391, "r": 475.604, "b": 595.943, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 226, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 458.17, "r_y0": 595.943, "r_x1": 475.604, "r_y1": 595.943, "r_x2": 475.604, "r_y2": 587.391, "r_x3": 458.17, "r_y3": 587.391, "coord_origin": "TOPLEFT"}, "text": "49.9", "orig": "49.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 111, "label": "text", "bbox": {"l": 497.034, "t": 587.391, "r": 514.468, "b": 595.943, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 227, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 497.034, "r_y0": 595.943, "r_x1": 514.468, "r_y1": 595.943, "r_x2": 514.468, "r_y2": 587.391, "r_x3": 497.034, "r_y3": 587.391, "coord_origin": "TOPLEFT"}, "text": "55.4", "orig": "55.4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 112, "label": "text", "bbox": {"l": 354.136, "t": 599.347, "r": 387.899, "b": 607.899, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 228, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 354.136, "r_y0": 607.899, "r_x1": 387.899, "r_y1": 607.899, "r_x2": 387.899, "r_y2": 599.347, "r_x3": 354.136, "r_y3": 599.347, "coord_origin": "TOPLEFT"}, "text": "Camelot", "orig": "Camelot", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 113, "label": "text", "bbox": {"l": 413.902, "t": 599.347, "r": 431.336, "b": 607.899, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 229, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 413.902, "r_y0": 607.899, "r_x1": 431.336, "r_y1": 607.899, "r_x2": 431.336, "r_y2": 599.347, "r_x3": 413.902, "r_y3": 599.347, "coord_origin": "TOPLEFT"}, "text": "80.0", "orig": "80.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 114, "label": "text", "bbox": {"l": 458.165, "t": 599.347, "r": 475.6, "b": 607.899, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 230, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 458.165, "r_y0": 607.899, "r_x1": 475.6, "r_y1": 607.899, "r_x2": 475.6, "r_y2": 599.347, "r_x3": 458.165, "r_y3": 599.347, "coord_origin": "TOPLEFT"}, "text": "66.0", "orig": "66.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 115, "label": "text", "bbox": {"l": 497.03, "t": 599.347, "r": 514.464, "b": 607.899, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 231, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 497.03, "r_y0": 607.899, "r_x1": 514.464, "r_y1": 607.899, "r_x2": 514.464, "r_y2": 599.347, "r_x3": 497.03, "r_y3": 599.347, "coord_origin": "TOPLEFT"}, "text": "73.0", "orig": "73.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 116, "label": "text", "bbox": {"l": 346.559, "t": 611.302, "r": 395.475, "b": 619.854, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 232, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 346.559, "r_y0": 619.854, "r_x1": 395.475, "r_y1": 619.854, "r_x2": 395.475, "r_y2": 611.302, "r_x3": 346.559, "r_y3": 611.302, "coord_origin": "TOPLEFT"}, "text": "Acrobat Pro", "orig": "Acrobat Pro", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 117, "label": "text", "bbox": {"l": 413.906, "t": 611.302, "r": 431.341, "b": 619.854, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 233, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 413.906, "r_y0": 619.854, "r_x1": 431.341, "r_y1": 619.854, "r_x2": 431.341, "r_y2": 611.302, "r_x3": 413.906, "r_y3": 611.302, "coord_origin": "TOPLEFT"}, "text": "68.9", "orig": "68.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 118, "label": "text", "bbox": {"l": 458.17, "t": 611.302, "r": 475.605, "b": 619.854, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 234, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 458.17, "r_y0": 619.854, "r_x1": 475.605, "r_y1": 619.854, "r_x2": 475.605, "r_y2": 611.302, "r_x3": 458.17, "r_y3": 611.302, "coord_origin": "TOPLEFT"}, "text": "61.8", "orig": "61.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 119, "label": "text", "bbox": {"l": 497.034, "t": 611.302, "r": 514.469, "b": 619.854, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 235, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 497.034, "r_y0": 619.854, "r_x1": 514.469, "r_y1": 619.854, "r_x2": 514.469, "r_y2": 611.302, "r_x3": 497.034, "r_y3": 611.302, "coord_origin": "TOPLEFT"}, "text": "65.3", "orig": "65.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 120, "label": "text", "bbox": {"l": 360.781, "t": 623.2570000000001, "r": 381.254, "b": 631.809, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 236, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 360.781, "r_y0": 631.809, "r_x1": 381.254, "r_y1": 631.809, "r_x2": 381.254, "r_y2": 623.2570000000001, "r_x3": 360.781, "r_y3": 623.2570000000001, "coord_origin": "TOPLEFT"}, "text": "EDD", "orig": "EDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 121, "label": "text", "bbox": {"l": 413.902, "t": 623.2570000000001, "r": 431.336, "b": 631.809, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 237, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 413.902, "r_y0": 631.809, "r_x1": 431.336, "r_y1": 631.809, "r_x2": 431.336, "r_y2": 623.2570000000001, "r_x3": 413.902, "r_y3": 623.2570000000001, "coord_origin": "TOPLEFT"}, "text": "91.2", "orig": "91.2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 122, "label": "text", "bbox": {"l": 458.165, "t": 623.2570000000001, "r": 475.6, "b": 631.809, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 238, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 458.165, "r_y0": 631.809, "r_x1": 475.6, "r_y1": 631.809, "r_x2": 475.6, "r_y2": 623.2570000000001, "r_x3": 458.165, "r_y3": 623.2570000000001, "coord_origin": "TOPLEFT"}, "text": "85.4", "orig": "85.4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 123, "label": "text", "bbox": {"l": 497.03, "t": 623.2570000000001, "r": 514.464, "b": 631.809, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 239, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 497.03, "r_y0": 631.809, "r_x1": 514.464, "r_y1": 631.809, "r_x2": 514.464, "r_y2": 623.2570000000001, "r_x3": 497.03, "r_y3": 623.2570000000001, "coord_origin": "TOPLEFT"}, "text": "88.3", "orig": "88.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 124, "label": "text", "bbox": {"l": 345.483, "t": 635.212, "r": 396.551, "b": 643.764, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 240, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 345.483, "r_y0": 643.764, "r_x1": 396.551, "r_y1": 643.764, "r_x2": 396.551, "r_y2": 635.212, "r_x3": 345.483, "r_y3": 635.212, "coord_origin": "TOPLEFT"}, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 125, "label": "text", "bbox": {"l": 413.906, "t": 635.212, "r": 431.341, "b": 643.764, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 241, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 413.906, "r_y0": 643.764, "r_x1": 431.341, "r_y1": 643.764, "r_x2": 431.341, "r_y2": 635.212, "r_x3": 413.906, "r_y3": 635.212, "coord_origin": "TOPLEFT"}, "text": "95.4", "orig": "95.4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 126, "label": "text", "bbox": {"l": 458.17, "t": 635.212, "r": 475.605, "b": 643.764, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 242, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 458.17, "r_y0": 643.764, "r_x1": 475.605, "r_y1": 643.764, "r_x2": 475.605, "r_y2": 635.212, "r_x3": 458.17, "r_y3": 635.212, "coord_origin": "TOPLEFT"}, "text": "90.1", "orig": "90.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 127, "label": "text", "bbox": {"l": 497.034, "t": 634.8240000000001, "r": 514.469, "b": 643.78, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 243, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 497.034, "r_y0": 643.78, "r_x1": 514.469, "r_y1": 643.78, "r_x2": 514.469, "r_y2": 634.8240000000001, "r_x3": 497.034, "r_y3": 634.8240000000001, "coord_origin": "TOPLEFT"}, "text": "93.6", "orig": "93.6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}]}, "text": null, "otsl_seq": ["fcel", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl"], "num_rows": 7, "num_cols": 4, "table_cells": [{"bbox": {"l": 358.011, "t": 552.502, "r": 384.023, "b": 561.054, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Model", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 448.695, "t": 546.524, "r": 485.079, "b": 567.031, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "TEDS Complex", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 408.506, "t": 558.479, "r": 436.74, "b": 567.031, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "Simple", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 499.385, "t": 558.479, "r": 512.117, "b": 567.031, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "All", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 357.682, "t": 575.436, "r": 384.352, "b": 583.988, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Tabula", "column_header": false, "row_header": true, "row_section": false}, {"bbox": {"l": 413.901, "t": 575.436, "r": 431.336, "b": 583.988, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "78.0", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 458.165, "t": 575.436, "r": 475.599, "b": 583.988, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "57.8", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 497.029, "t": 575.436, "r": 514.463, "b": 583.988, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "67.9", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 350.723, "t": 587.391, "r": 391.311, "b": 595.943, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Traprange", "column_header": false, "row_header": true, "row_section": false}, {"bbox": {"l": 413.906, "t": 587.391, "r": 431.34, "b": 595.943, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "60.8", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 458.17, "t": 587.391, "r": 475.604, "b": 595.943, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "49.9", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 497.034, "t": 587.391, "r": 514.468, "b": 595.943, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "55.4", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 354.136, "t": 599.347, "r": 387.899, "b": 607.899, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Camelot", "column_header": false, "row_header": true, "row_section": false}, {"bbox": {"l": 413.902, "t": 599.347, "r": 431.336, "b": 607.899, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "80.0", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 458.165, "t": 599.347, "r": 475.6, "b": 607.899, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "66.0", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 497.03, "t": 599.347, "r": 514.464, "b": 607.899, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "73.0", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 346.559, "t": 611.302, "r": 395.475, "b": 619.854, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Acrobat Pro", "column_header": false, "row_header": true, "row_section": false}, {"bbox": {"l": 413.906, "t": 611.302, "r": 431.341, "b": 619.854, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "68.9", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 458.17, "t": 611.302, "r": 475.605, "b": 619.854, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "61.8", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 497.034, "t": 611.302, "r": 514.469, "b": 619.854, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "65.3", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 360.781, "t": 623.2570000000001, "r": 381.254, "b": 631.809, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "EDD", "column_header": false, "row_header": true, "row_section": false}, {"bbox": {"l": 413.902, "t": 623.2570000000001, "r": 431.336, "b": 631.809, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "91.2", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 458.165, "t": 623.2570000000001, "r": 475.6, "b": 631.809, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "85.4", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 497.03, "t": 623.2570000000001, "r": 514.464, "b": 631.809, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "88.3", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 345.483, "t": 635.212, "r": 396.551, "b": 643.764, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "TableFormer", "column_header": false, "row_header": true, "row_section": false}, {"bbox": {"l": 413.906, "t": 635.212, "r": 431.341, "b": 643.764, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "95.4", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 458.17, "t": 635.212, "r": 475.605, "b": 643.764, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "90.1", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 497.034, "t": 634.8240000000001, "r": 514.469, "b": 643.78, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "93.6", "column_header": false, "row_header": false, "row_section": false}]}, {"label": "caption", "id": 11, "page_no": 6, "cluster": {"id": 11, "label": "caption", "bbox": {"l": 308.862, "t": 657.13, "r": 545.115, "b": 689.592, "coord_origin": "TOPLEFT"}, "confidence": 0.9541404247283936, "cells": [{"index": 244, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 665.682, "r_x1": 341.739, "r_y1": 665.682, "r_x2": 341.739, "r_y2": 657.13, "r_x3": 308.862, "r_y3": 657.13, "coord_origin": "TOPLEFT"}, "text": "Table 4:", "orig": "Table 4:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 245, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 349.559, "r_y0": 665.682, "r_x1": 545.115, "r_y1": 665.682, "r_x2": 545.115, "r_y2": 657.13, "r_x3": 349.559, "r_y3": 657.13, "coord_origin": "TOPLEFT"}, "text": "Results of structure with content retrieved using", "orig": "Results of structure with content retrieved using", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 246, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 677.637, "r_x1": 425.763, "r_y1": 677.637, "r_x2": 425.763, "r_y2": 669.085, "r_x3": 308.862, "r_y3": 669.085, "coord_origin": "TOPLEFT"}, "text": "cell detection on PubTabNet.", "orig": "cell detection on PubTabNet.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 247, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 430.336, "r_y0": 677.637, "r_x1": 545.115, "r_y1": 677.637, "r_x2": 545.115, "r_y2": 669.085, "r_x3": 430.336, "r_y3": 669.085, "coord_origin": "TOPLEFT"}, "text": "In all cases the input is PDF", "orig": "In all cases the input is PDF", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 248, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 689.592, "r_x1": 435.038, "r_y1": 689.592, "r_x2": 435.038, "r_y2": 681.04, "r_x3": 308.862, "r_y3": 681.04, "coord_origin": "TOPLEFT"}, "text": "documents with cropped tables.", "orig": "documents with cropped tables.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Table 4: Results of structure with content retrieved using cell detection on PubTabNet. In all cases the input is PDF documents with cropped tables."}, {"label": "page_footer", "id": 14, "page_no": 6, "cluster": {"id": 14, "label": "page_footer", "bbox": {"l": 295.121, "t": 734.402, "r": 300.102, "b": 742.954, "coord_origin": "TOPLEFT"}, "confidence": 0.8787972331047058, "cells": [{"index": 249, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 295.121, "r_y0": 742.954, "r_x1": 300.102, "r_y1": 742.954, "r_x2": 300.102, "r_y2": 734.402, "r_x3": 295.121, "r_y3": 734.402, "coord_origin": "TOPLEFT"}, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "7"}], "body": [{"label": "section_header", "id": 10, "page_no": 6, "cluster": {"id": 10, "label": "section_header", "bbox": {"l": 50.112, "t": 74.40099999999995, "r": 167.898, "b": 84.25300000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.9554274082183838, "cells": [{"index": 0, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 84.25300000000004, "r_x1": 167.898, "r_y1": 84.25300000000004, "r_x2": 167.898, "r_y2": 74.40099999999995, "r_x3": 50.112, "r_y3": 74.40099999999995, "coord_origin": "TOPLEFT"}, "text": "5.3. Datasets and Metrics", "orig": "5.3. Datasets and Metrics", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "5.3. Datasets and Metrics"}, {"label": "text", "id": 1, "page_no": 6, "cluster": {"id": 1, "label": "text", "bbox": {"l": 50.112, "t": 93.61900000000003, "r": 286.365, "b": 138.03700000000003, "coord_origin": "TOPLEFT"}, "confidence": 0.9862998127937317, "cells": [{"index": 1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 102.17100000000005, "r_x1": 286.365, "r_y1": 102.17100000000005, "r_x2": 286.365, "r_y2": 93.61900000000003, "r_x3": 62.067, "r_y3": 93.61900000000003, "coord_origin": "TOPLEFT"}, "text": "The Tree-Edit-Distance-Based Similarity (TEDS) met-", "orig": "The Tree-Edit-Distance-Based Similarity (TEDS) met-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 114.12599999999998, "r_x1": 286.365, "r_y1": 114.12599999999998, "r_x2": 286.365, "r_y2": 105.57399999999996, "r_x3": 50.112, "r_y3": 105.57399999999996, "coord_origin": "TOPLEFT"}, "text": "ric was introduced in [37]. It represents the prediction, and", "orig": "ric was introduced in [37]. It represents the prediction, and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 126.08100000000002, "r_x1": 239.999, "r_y1": 126.08100000000002, "r_x2": 239.999, "r_y2": 117.529, "r_x3": 50.112, "r_y3": 117.529, "coord_origin": "TOPLEFT"}, "text": "ground-truth as a tree structure of HTML tags.", "orig": "ground-truth as a tree structure of HTML tags.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 245.03, "r_y0": 126.08100000000002, "r_x1": 286.365, "r_y1": 126.08100000000002, "r_x2": 286.365, "r_y2": 117.529, "r_x3": 245.03, "r_y3": 117.529, "coord_origin": "TOPLEFT"}, "text": "This simi-", "orig": "This simi-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 138.03700000000003, "r_x1": 136.717, "r_y1": 138.03700000000003, "r_x2": 136.717, "r_y2": 129.485, "r_x3": 50.112, "r_y3": 129.485, "coord_origin": "TOPLEFT"}, "text": "larity is calculated as:", "orig": "larity is calculated as:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "The Tree-Edit-Distance-Based Similarity (TEDS) metric was introduced in [37]. It represents the prediction, and ground-truth as a tree structure of HTML tags. This similarity is calculated as:"}, {"label": "formula", "id": 13, "page_no": 6, "cluster": {"id": 13, "label": "formula", "bbox": {"l": 86.219, "t": 150.428, "r": 286.362, "b": 173.63199999999995, "coord_origin": "TOPLEFT"}, "confidence": 0.9500409364700317, "cells": [{"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 86.219, "r_y0": 165.87400000000002, "r_x1": 118.878, "r_y1": 165.87400000000002, "r_x2": 118.878, "r_y2": 157.168, "r_x3": 86.219, "r_y3": 157.168, "coord_origin": "TOPLEFT"}, "text": "TEDS(", "orig": "TEDS(", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 118.875, "r_y0": 165.87400000000002, "r_x1": 139.77, "r_y1": 165.87400000000002, "r_x2": 139.77, "r_y2": 157.168, "r_x3": 118.875, "r_y3": 157.168, "coord_origin": "TOPLEFT"}, "text": "T , T", "orig": "T , T", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 124.697, "r_y0": 166.798, "r_x1": 129.019, "r_y1": 166.798, "r_x2": 129.019, "r_y2": 160.70399999999995, "r_x3": 124.697, "r_y3": 160.70399999999995, "coord_origin": "TOPLEFT"}, "text": "a", "orig": "a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 139.766, "r_y0": 166.798, "r_x1": 143.27, "r_y1": 166.798, "r_x2": 143.27, "r_y2": 160.70399999999995, "r_x3": 139.766, "r_y3": 160.70399999999995, "coord_origin": "TOPLEFT"}, "text": "b", "orig": "b", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 143.768, "r_y0": 165.87400000000002, "r_x1": 165.902, "r_y1": 165.87400000000002, "r_x2": 165.902, "r_y2": 157.168, "r_x3": 143.768, "r_y3": 157.168, "coord_origin": "TOPLEFT"}, "text": ") = 1", "orig": ") = 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 168.121, "r_y0": 165.73199999999997, "r_x1": 175.87, "r_y1": 165.73199999999997, "r_x2": 175.87, "r_y2": 157.168, "r_x3": 168.121, "r_y3": 157.168, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 179.279, "r_y0": 159.13400000000001, "r_x1": 221.957, "r_y1": 159.13400000000001, "r_x2": 221.957, "r_y2": 150.428, "r_x3": 179.279, "r_y3": 150.428, "coord_origin": "TOPLEFT"}, "text": "EditDist (", "orig": "EditDist (", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 221.952, "r_y0": 159.13400000000001, "r_x1": 242.848, "r_y1": 159.13400000000001, "r_x2": 242.848, "r_y2": 150.428, "r_x3": 221.952, "r_y3": 150.428, "coord_origin": "TOPLEFT"}, "text": "T , T", "orig": "T , T", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 227.774, "r_y0": 160.058, "r_x1": 232.096, "r_y1": 160.058, "r_x2": 232.096, "r_y2": 153.96400000000006, "r_x3": 227.774, "r_y3": 153.96400000000006, "coord_origin": "TOPLEFT"}, "text": "a", "orig": "a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 242.843, "r_y0": 160.058, "r_x1": 246.347, "r_y1": 160.058, "r_x2": 246.347, "r_y2": 153.96400000000006, "r_x3": 242.843, "r_y3": 153.96400000000006, "coord_origin": "TOPLEFT"}, "text": "b", "orig": "b", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 246.845, "r_y0": 159.13400000000001, "r_x1": 250.719, "r_y1": 159.13400000000001, "r_x2": 250.719, "r_y2": 150.428, "r_x3": 246.845, "r_y3": 150.428, "coord_origin": "TOPLEFT"}, "text": ")", "orig": ")", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 182.212, "r_y0": 172.70799999999997, "r_x1": 206.292, "r_y1": 172.70799999999997, "r_x2": 206.292, "r_y2": 164.00199999999995, "r_x3": 182.212, "r_y3": 164.00199999999995, "coord_origin": "TOPLEFT"}, "text": "max(", "orig": "max(", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 206.289, "r_y0": 172.56600000000003, "r_x1": 209.057, "r_y1": 172.56600000000003, "r_x2": 209.057, "r_y2": 164.00199999999995, "r_x3": 206.289, "r_y3": 164.00199999999995, "coord_origin": "TOPLEFT"}, "text": "|", "orig": "|", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 19, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 209.056, "r_y0": 172.70799999999997, "r_x1": 214.878, "r_y1": 172.70799999999997, "r_x2": 214.878, "r_y2": 164.00199999999995, "r_x3": 209.056, "r_y3": 164.00199999999995, "coord_origin": "TOPLEFT"}, "text": "T", "orig": "T", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 20, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 214.878, "r_y0": 173.63199999999995, "r_x1": 219.2, "r_y1": 173.63199999999995, "r_x2": 219.2, "r_y2": 167.538, "r_x3": 214.878, "r_y3": 167.538, "coord_origin": "TOPLEFT"}, "text": "a", "orig": "a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 21, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 219.697, "r_y0": 172.56600000000003, "r_x1": 222.465, "r_y1": 172.56600000000003, "r_x2": 222.465, "r_y2": 164.00199999999995, "r_x3": 219.697, "r_y3": 164.00199999999995, "coord_origin": "TOPLEFT"}, "text": "|", "orig": "|", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 22, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 224.125, "r_y0": 172.70799999999997, "r_x1": 226.893, "r_y1": 172.70799999999997, "r_x2": 226.893, "r_y2": 164.00199999999995, "r_x3": 224.125, "r_y3": 164.00199999999995, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 23, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 228.553, "r_y0": 172.56600000000003, "r_x1": 231.321, "r_y1": 172.56600000000003, "r_x2": 231.321, "r_y2": 164.00199999999995, "r_x3": 228.553, "r_y3": 164.00199999999995, "coord_origin": "TOPLEFT"}, "text": "|", "orig": "|", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 24, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 231.32, "r_y0": 172.70799999999997, "r_x1": 237.142, "r_y1": 172.70799999999997, "r_x2": 237.142, "r_y2": 164.00199999999995, "r_x3": 231.32, "r_y3": 164.00199999999995, "coord_origin": "TOPLEFT"}, "text": "T", "orig": "T", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 25, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 237.142, "r_y0": 173.63199999999995, "r_x1": 240.646, "r_y1": 173.63199999999995, "r_x2": 240.646, "r_y2": 167.538, "r_x3": 237.142, "r_y3": 167.538, "coord_origin": "TOPLEFT"}, "text": "b", "orig": "b", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 26, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 241.144, "r_y0": 172.56600000000003, "r_x1": 243.912, "r_y1": 172.56600000000003, "r_x2": 243.912, "r_y2": 164.00199999999995, "r_x3": 241.144, "r_y3": 164.00199999999995, "coord_origin": "TOPLEFT"}, "text": "|", "orig": "|", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 27, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 243.911, "r_y0": 172.70799999999997, "r_x1": 247.785, "r_y1": 172.70799999999997, "r_x2": 247.785, "r_y2": 164.00199999999995, "r_x3": 243.911, "r_y3": 164.00199999999995, "coord_origin": "TOPLEFT"}, "text": ")", "orig": ")", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 28, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 274.746, "r_y0": 166.038, "r_x1": 286.362, "r_y1": 166.038, "r_x2": 286.362, "r_y2": 157.486, "r_x3": 274.746, "r_y3": 157.486, "coord_origin": "TOPLEFT"}, "text": "(3)", "orig": "(3)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "TEDS( T , T a b ) = 1 -EditDist ( T , T a b ) max( | T a | , | T b | ) (3)"}, {"label": "text", "id": 6, "page_no": 6, "cluster": {"id": 6, "label": "text", "bbox": {"l": 50.112, "t": 181.11300000000006, "r": 286.363, "b": 213.89300000000003, "coord_origin": "TOPLEFT"}, "confidence": 0.9735319018363953, "cells": [{"index": 29, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 189.98299999999995, "r_x1": 86.406, "r_y1": 189.98299999999995, "r_x2": 86.406, "r_y2": 181.43100000000004, "r_x3": 62.067, "r_y3": 181.43100000000004, "coord_origin": "TOPLEFT"}, "text": "where", "orig": "where", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 30, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 88.581, "r_y0": 189.81899999999996, "r_x1": 94.403, "r_y1": 189.81899999999996, "r_x2": 94.403, "r_y2": 181.11300000000006, "r_x3": 88.581, "r_y3": 181.11300000000006, "coord_origin": "TOPLEFT"}, "text": "T", "orig": "T", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 94.403, "r_y0": 190.74199999999996, "r_x1": 98.725, "r_y1": 190.74199999999996, "r_x2": 98.725, "r_y2": 184.64800000000002, "r_x3": 94.403, "r_y3": 184.64800000000002, "coord_origin": "TOPLEFT"}, "text": "a", "orig": "a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 101.399, "r_y0": 189.98299999999995, "r_x1": 115.785, "r_y1": 189.98299999999995, "r_x2": 115.785, "r_y2": 181.43100000000004, "r_x3": 101.399, "r_y3": 181.43100000000004, "coord_origin": "TOPLEFT"}, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 117.961, "r_y0": 189.81899999999996, "r_x1": 123.783, "r_y1": 189.81899999999996, "r_x2": 123.783, "r_y2": 181.11300000000006, "r_x3": 117.961, "r_y3": 181.11300000000006, "coord_origin": "TOPLEFT"}, "text": "T", "orig": "T", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 123.783, "r_y0": 190.74199999999996, "r_x1": 127.287, "r_y1": 190.74199999999996, "r_x2": 127.287, "r_y2": 184.64800000000002, "r_x3": 123.783, "r_y3": 184.64800000000002, "coord_origin": "TOPLEFT"}, "text": "b", "orig": "b", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 129.96, "r_y0": 189.98299999999995, "r_x1": 286.363, "r_y1": 189.98299999999995, "r_x2": 286.363, "r_y2": 181.43100000000004, "r_x3": 129.96, "r_y3": 181.43100000000004, "coord_origin": "TOPLEFT"}, "text": "represent tables in tree structure HTML", "orig": "represent tables in tree structure HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 201.938, "r_x1": 252.781, "r_y1": 201.938, "r_x2": 252.781, "r_y2": 193.38599999999997, "r_x3": 50.112, "r_y3": 193.38599999999997, "coord_origin": "TOPLEFT"}, "text": "format. EditDist denotes the tree-edit distance, and", "orig": "format. EditDist denotes the tree-edit distance, and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 255.182, "r_y0": 201.63199999999995, "r_x1": 257.95, "r_y1": 201.63199999999995, "r_x2": 257.95, "r_y2": 193.06799999999998, "r_x3": 255.182, "r_y3": 193.06799999999998, "coord_origin": "TOPLEFT"}, "text": "|", "orig": "|", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 257.949, "r_y0": 201.774, "r_x1": 263.771, "r_y1": 201.774, "r_x2": 263.771, "r_y2": 193.06799999999998, "r_x3": 257.949, "r_y3": 193.06799999999998, "coord_origin": "TOPLEFT"}, "text": "T", "orig": "T", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 265.155, "r_y0": 201.63199999999995, "r_x1": 267.923, "r_y1": 201.63199999999995, "r_x2": 267.923, "r_y2": 193.06799999999998, "r_x3": 265.155, "r_y3": 193.06799999999998, "coord_origin": "TOPLEFT"}, "text": "|", "orig": "|", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 270.322, "r_y0": 201.938, "r_x1": 286.362, "r_y1": 201.938, "r_x2": 286.362, "r_y2": 193.38599999999997, "r_x3": 270.322, "r_y3": 193.38599999999997, "coord_origin": "TOPLEFT"}, "text": "rep-", "orig": "rep-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 213.89300000000003, "r_x1": 172.134, "r_y1": 213.89300000000003, "r_x2": 172.134, "r_y2": 205.341, "r_x3": 50.112, "r_y3": 205.341, "coord_origin": "TOPLEFT"}, "text": "resents the number of nodes in", "orig": "resents the number of nodes in", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 174.624, "r_y0": 213.72900000000004, "r_x1": 180.446, "r_y1": 213.72900000000004, "r_x2": 180.446, "r_y2": 205.02300000000002, "r_x3": 174.624, "r_y3": 205.02300000000002, "coord_origin": "TOPLEFT"}, "text": "T", "orig": "T", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 181.829, "r_y0": 213.89300000000003, "r_x1": 184.32, "r_y1": 213.89300000000003, "r_x2": 184.32, "r_y2": 205.341, "r_x3": 181.829, "r_y3": 205.341, "coord_origin": "TOPLEFT"}, "text": ".", "orig": ".", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "where T a and T b represent tables in tree structure HTML format. EditDist denotes the tree-edit distance, and | T | represents the number of nodes in T ."}, {"label": "section_header", "id": 9, "page_no": 6, "cluster": {"id": 9, "label": "section_header", "bbox": {"l": 50.112, "t": 224.81899999999996, "r": 170.452, "b": 234.67100000000005, "coord_origin": "TOPLEFT"}, "confidence": 0.9588837027549744, "cells": [{"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 234.67100000000005, "r_x1": 170.452, "r_y1": 234.67100000000005, "r_x2": 170.452, "r_y2": 224.81899999999996, "r_x3": 50.112, "r_y3": 224.81899999999996, "coord_origin": "TOPLEFT"}, "text": "5.4. Quantitative Analysis", "orig": "5.4. Quantitative Analysis", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "5.4. Quantitative Analysis"}, {"label": "text", "id": 2, "page_no": 6, "cluster": {"id": 2, "label": "text", "bbox": {"l": 50.112, "t": 243.64999999999998, "r": 286.365, "b": 396.052, "coord_origin": "TOPLEFT"}, "confidence": 0.9855090975761414, "cells": [{"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 252.606, "r_x1": 105.325, "r_y1": 252.606, "r_x2": 105.325, "r_y2": 243.64999999999998, "r_x3": 62.067, "r_y3": 243.64999999999998, "coord_origin": "TOPLEFT"}, "text": "Structure.", "orig": "Structure.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 112.126, "r_y0": 252.59000000000003, "r_x1": 184.684, "r_y1": 252.59000000000003, "r_x2": 184.684, "r_y2": 244.038, "r_x3": 112.126, "r_y3": 244.038, "coord_origin": "TOPLEFT"}, "text": "As shown in Tab.", "orig": "As shown in Tab.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 191.478, "r_y0": 252.59000000000003, "r_x1": 198.95, "r_y1": 252.59000000000003, "r_x2": 198.95, "r_y2": 244.038, "r_x3": 191.478, "r_y3": 244.038, "coord_origin": "TOPLEFT"}, "text": "2,", "orig": "2,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 48, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 202.995, "r_y0": 252.59000000000003, "r_x1": 286.362, "r_y1": 252.59000000000003, "r_x2": 286.362, "r_y2": 244.038, "r_x3": 202.995, "r_y3": 244.038, "coord_origin": "TOPLEFT"}, "text": "TableFormer outper-", "orig": "TableFormer outper-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 49, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 264.54499999999996, "r_x1": 286.365, "r_y1": 264.54499999999996, "r_x2": 286.365, "r_y2": 255.99300000000005, "r_x3": 50.112, "r_y3": 255.99300000000005, "coord_origin": "TOPLEFT"}, "text": "forms all SOTA methods across different datasets by a large", "orig": "forms all SOTA methods across different datasets by a large", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 50, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 276.5, "r_x1": 138.719, "r_y1": 276.5, "r_x2": 138.719, "r_y2": 267.948, "r_x3": 50.112, "r_y3": 267.948, "coord_origin": "TOPLEFT"}, "text": "margin for predicting", "orig": "margin for predicting", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 51, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 142.993, "r_y0": 276.5, "r_x1": 155.168, "r_y1": 276.5, "r_x2": 155.168, "r_y2": 267.948, "r_x3": 142.993, "r_y3": 267.948, "coord_origin": "TOPLEFT"}, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 52, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 159.432, "r_y0": 276.5, "r_x1": 178.799, "r_y1": 276.5, "r_x2": 178.799, "r_y2": 267.948, "r_x3": 159.432, "r_y3": 267.948, "coord_origin": "TOPLEFT"}, "text": "table", "orig": "table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 53, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.073, "r_y0": 276.5, "r_x1": 217.932, "r_y1": 276.5, "r_x2": 217.932, "r_y2": 267.948, "r_x3": 183.073, "r_y3": 267.948, "coord_origin": "TOPLEFT"}, "text": "structure", "orig": "structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 54, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 222.206, "r_y0": 276.5, "r_x1": 286.365, "r_y1": 276.5, "r_x2": 286.365, "r_y2": 267.948, "r_x3": 222.206, "r_y3": 267.948, "coord_origin": "TOPLEFT"}, "text": "from an image.", "orig": "from an image.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 55, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 288.455, "r_x1": 286.365, "r_y1": 288.455, "r_x2": 286.365, "r_y2": 279.903, "r_x3": 50.112, "r_y3": 279.903, "coord_origin": "TOPLEFT"}, "text": "All the more, our model outperforms pre-trained methods.", "orig": "All the more, our model outperforms pre-trained methods.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 56, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 300.411, "r_x1": 286.365, "r_y1": 300.411, "r_x2": 286.365, "r_y2": 291.859, "r_x3": 50.112, "r_y3": 291.859, "coord_origin": "TOPLEFT"}, "text": "During the evaluation we do not apply any table filtering.", "orig": "During the evaluation we do not apply any table filtering.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 57, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 312.366, "r_x1": 286.365, "r_y1": 312.366, "r_x2": 286.365, "r_y2": 303.814, "r_x3": 50.112, "r_y3": 303.814, "coord_origin": "TOPLEFT"}, "text": "We also provide our baseline results on the SynthTabNet", "orig": "We also provide our baseline results on the SynthTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 58, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 324.321, "r_x1": 80.269, "r_y1": 324.321, "r_x2": 80.269, "r_y2": 315.769, "r_x3": 50.112, "r_y3": 315.769, "coord_origin": "TOPLEFT"}, "text": "dataset.", "orig": "dataset.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 59, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 85.579, "r_y0": 324.321, "r_x1": 91.666, "r_y1": 324.321, "r_x2": 91.666, "r_y2": 315.769, "r_x3": 85.579, "r_y3": 315.769, "coord_origin": "TOPLEFT"}, "text": "It", "orig": "It", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 60, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 94.894, "r_y0": 324.321, "r_x1": 257.812, "r_y1": 324.321, "r_x2": 257.812, "r_y2": 315.769, "r_x3": 94.894, "r_y3": 315.769, "coord_origin": "TOPLEFT"}, "text": "has been observed that large tables (e.g.", "orig": "has been observed that large tables (e.g.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 61, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 263.122, "r_y0": 324.321, "r_x1": 286.365, "r_y1": 324.321, "r_x2": 286.365, "r_y2": 315.769, "r_x3": 263.122, "r_y3": 315.769, "coord_origin": "TOPLEFT"}, "text": "tables", "orig": "tables", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 62, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 336.276, "r_x1": 286.365, "r_y1": 336.276, "r_x2": 286.365, "r_y2": 327.724, "r_x3": 50.112, "r_y3": 327.724, "coord_origin": "TOPLEFT"}, "text": "that occupy half of the page or more) yield poor predictions.", "orig": "that occupy half of the page or more) yield poor predictions.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 63, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 348.231, "r_x1": 286.365, "r_y1": 348.231, "r_x2": 286.365, "r_y2": 339.679, "r_x3": 50.112, "r_y3": 339.679, "coord_origin": "TOPLEFT"}, "text": "We attribute this issue to the image resizing during the pre-", "orig": "We attribute this issue to the image resizing during the pre-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 64, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 360.186, "r_x1": 115.068, "r_y1": 360.186, "r_x2": 115.068, "r_y2": 351.634, "r_x3": 50.112, "r_y3": 351.634, "coord_origin": "TOPLEFT"}, "text": "processing step,", "orig": "processing step,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 65, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 119.203, "r_y0": 360.186, "r_x1": 134.147, "r_y1": 360.186, "r_x2": 134.147, "r_y2": 351.634, "r_x3": 119.203, "r_y3": 351.634, "coord_origin": "TOPLEFT"}, "text": "that", "orig": "that", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 66, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 137.952, "r_y0": 360.186, "r_x1": 286.365, "r_y1": 360.186, "r_x2": 286.365, "r_y2": 351.634, "r_x3": 137.952, "r_y3": 351.634, "coord_origin": "TOPLEFT"}, "text": "produces downsampled images with", "orig": "produces downsampled images with", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 67, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 372.142, "r_x1": 155.357, "r_y1": 372.142, "r_x2": 155.357, "r_y2": 363.59, "r_x3": 50.112, "r_y3": 363.59, "coord_origin": "TOPLEFT"}, "text": "indistinguishable features.", "orig": "indistinguishable features.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 68, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.378, "r_y0": 372.142, "r_x1": 286.365, "r_y1": 372.142, "r_x2": 286.365, "r_y2": 363.59, "r_x3": 160.378, "r_y3": 363.59, "coord_origin": "TOPLEFT"}, "text": "This problem can be addressed", "orig": "This problem can be addressed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 69, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 384.097, "r_x1": 286.365, "r_y1": 384.097, "r_x2": 286.365, "r_y2": 375.545, "r_x3": 50.112, "r_y3": 375.545, "coord_origin": "TOPLEFT"}, "text": "by treating such big tables with a separate model which ac-", "orig": "by treating such big tables with a separate model which ac-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 70, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 396.052, "r_x1": 170.012, "r_y1": 396.052, "r_x2": 170.012, "r_y2": 387.5, "r_x3": 50.112, "r_y3": 387.5, "coord_origin": "TOPLEFT"}, "text": "cepts a large input image size.", "orig": "cepts a large input image size.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Structure. As shown in Tab. 2, TableFormer outperforms all SOTA methods across different datasets by a large margin for predicting the table structure from an image. All the more, our model outperforms pre-trained methods. During the evaluation we do not apply any table filtering. We also provide our baseline results on the SynthTabNet dataset. It has been observed that large tables (e.g. tables that occupy half of the page or more) yield poor predictions. We attribute this issue to the image resizing during the preprocessing step, that produces downsampled images with indistinguishable features. This problem can be addressed by treating such big tables with a separate model which accepts a large input image size."}, {"label": "table", "id": 0, "page_no": 6, "cluster": {"id": 0, "label": "table", "bbox": {"l": 53.368526458740234, "t": 409.1357727050781, "r": 283.0443420410156, "b": 582.3977661132812, "coord_origin": "TOPLEFT"}, "confidence": 0.9892510175704956, "cells": [{"index": 71, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 78.843, "r_y0": 429.511, "r_x1": 104.855, "r_y1": 429.511, "r_x2": 104.855, "r_y2": 420.959, "r_x3": 78.843, "r_y3": 420.959, "coord_origin": "TOPLEFT"}, "text": "Model", "orig": "Model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 72, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 211.2, "r_y0": 423.533, "r_x1": 236.107, "r_y1": 423.533, "r_x2": 236.107, "r_y2": 414.981, "r_x3": 211.2, "r_y3": 414.981, "coord_origin": "TOPLEFT"}, "text": "TEDS", "orig": "TEDS", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 73, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 129.338, "r_y0": 435.488, "r_x1": 159.216, "r_y1": 435.488, "r_x2": 159.216, "r_y2": 426.936, "r_x3": 129.338, "r_y3": 426.936, "coord_origin": "TOPLEFT"}, "text": "Dataset", "orig": "Dataset", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 74, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 171.171, "r_y0": 435.488, "r_x1": 199.405, "r_y1": 435.488, "r_x2": 199.405, "r_y2": 426.936, "r_x3": 171.171, "r_y3": 426.936, "coord_origin": "TOPLEFT"}, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 75, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 211.36, "r_y0": 435.488, "r_x1": 247.744, "r_y1": 435.488, "r_x2": 247.744, "r_y2": 426.936, "r_x3": 211.36, "r_y3": 426.936, "coord_origin": "TOPLEFT"}, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 76, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 264.54, "r_y0": 435.488, "r_x1": 277.273, "r_y1": 435.488, "r_x2": 277.273, "r_y2": 426.936, "r_x3": 264.54, "r_y3": 426.936, "coord_origin": "TOPLEFT"}, "text": "All", "orig": "All", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 77, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 81.612, "r_y0": 452.445, "r_x1": 102.085, "r_y1": 452.445, "r_x2": 102.085, "r_y2": 443.893, "r_x3": 81.612, "r_y3": 443.893, "coord_origin": "TOPLEFT"}, "text": "EDD", "orig": "EDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 78, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.872, "r_y0": 452.445, "r_x1": 153.691, "r_y1": 452.445, "r_x2": 153.691, "r_y2": 443.893, "r_x3": 134.872, "r_y3": 443.893, "coord_origin": "TOPLEFT"}, "text": "PTN", "orig": "PTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 79, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 176.566, "r_y0": 452.445, "r_x1": 194.0, "r_y1": 452.445, "r_x2": 194.0, "r_y2": 443.893, "r_x3": 176.566, "r_y3": 443.893, "coord_origin": "TOPLEFT"}, "text": "91.1", "orig": "91.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 80, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 220.829, "r_y0": 452.445, "r_x1": 238.264, "r_y1": 452.445, "r_x2": 238.264, "r_y2": 443.893, "r_x3": 220.829, "r_y3": 443.893, "coord_origin": "TOPLEFT"}, "text": "88.7", "orig": "88.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 81, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 262.184, "r_y0": 452.445, "r_x1": 279.619, "r_y1": 452.445, "r_x2": 279.619, "r_y2": 443.893, "r_x3": 262.184, "r_y3": 443.893, "coord_origin": "TOPLEFT"}, "text": "89.9", "orig": "89.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 82, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 82.165, "r_y0": 464.401, "r_x1": 101.532, "r_y1": 464.401, "r_x2": 101.532, "r_y2": 455.849, "r_x3": 82.165, "r_y3": 455.849, "coord_origin": "TOPLEFT"}, "text": "GTE", "orig": "GTE", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 83, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.867, "r_y0": 464.401, "r_x1": 153.687, "r_y1": 464.401, "r_x2": 153.687, "r_y2": 455.849, "r_x3": 134.867, "r_y3": 455.849, "coord_origin": "TOPLEFT"}, "text": "PTN", "orig": "PTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 84, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.624, "r_y0": 464.401, "r_x1": 186.942, "r_y1": 464.401, "r_x2": 186.942, "r_y2": 455.849, "r_x3": 183.624, "r_y3": 455.849, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 85, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 227.888, "r_y0": 464.401, "r_x1": 231.205, "r_y1": 464.401, "r_x2": 231.205, "r_y2": 455.849, "r_x3": 227.888, "r_y3": 455.849, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 86, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 259.699, "r_y0": 464.401, "r_x1": 282.114, "r_y1": 464.401, "r_x2": 282.114, "r_y2": 455.849, "r_x3": 259.699, "r_y3": 455.849, "coord_origin": "TOPLEFT"}, "text": "93.01", "orig": "93.01", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 87, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 66.315, "r_y0": 476.954, "r_x1": 117.383, "r_y1": 476.954, "r_x2": 117.383, "r_y2": 468.402, "r_x3": 66.315, "r_y3": 468.402, "coord_origin": "TOPLEFT"}, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 88, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.868, "r_y0": 476.954, "r_x1": 153.687, "r_y1": 476.954, "r_x2": 153.687, "r_y2": 468.402, "r_x3": 134.868, "r_y3": 468.402, "coord_origin": "TOPLEFT"}, "text": "PTN", "orig": "PTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 89, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 176.571, "r_y0": 476.954, "r_x1": 194.006, "r_y1": 476.954, "r_x2": 194.006, "r_y2": 468.402, "r_x3": 176.571, "r_y3": 468.402, "coord_origin": "TOPLEFT"}, "text": "98.5", "orig": "98.5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 90, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 220.835, "r_y0": 476.954, "r_x1": 238.269, "r_y1": 476.954, "r_x2": 238.269, "r_y2": 468.402, "r_x3": 220.835, "r_y3": 468.402, "coord_origin": "TOPLEFT"}, "text": "95.0", "orig": "95.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 91, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 259.698, "r_y0": 476.97, "r_x1": 282.114, "r_y1": 476.97, "r_x2": 282.114, "r_y2": 468.014, "r_x3": 259.698, "r_y3": 468.014, "coord_origin": "TOPLEFT"}, "text": "96.75", "orig": "96.75", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 92, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 81.612, "r_y0": 492.147, "r_x1": 102.085, "r_y1": 492.147, "r_x2": 102.085, "r_y2": 483.595, "r_x3": 81.612, "r_y3": 483.595, "coord_origin": "TOPLEFT"}, "text": "EDD", "orig": "EDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 93, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.872, "r_y0": 492.147, "r_x1": 153.691, "r_y1": 492.147, "r_x2": 153.691, "r_y2": 483.595, "r_x3": 134.872, "r_y3": 483.595, "coord_origin": "TOPLEFT"}, "text": "FTN", "orig": "FTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 94, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 176.566, "r_y0": 492.147, "r_x1": 194.0, "r_y1": 492.147, "r_x2": 194.0, "r_y2": 483.595, "r_x3": 176.566, "r_y3": 483.595, "coord_origin": "TOPLEFT"}, "text": "88.4", "orig": "88.4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 95, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 218.339, "r_y0": 492.147, "r_x1": 240.755, "r_y1": 492.147, "r_x2": 240.755, "r_y2": 483.595, "r_x3": 218.339, "r_y3": 483.595, "coord_origin": "TOPLEFT"}, "text": "92.08", "orig": "92.08", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 96, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 262.184, "r_y0": 492.147, "r_x1": 279.619, "r_y1": 492.147, "r_x2": 279.619, "r_y2": 483.595, "r_x3": 262.184, "r_y3": 483.595, "coord_origin": "TOPLEFT"}, "text": "90.6", "orig": "90.6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 97, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 82.165, "r_y0": 504.102, "r_x1": 101.532, "r_y1": 504.102, "r_x2": 101.532, "r_y2": 495.55, "r_x3": 82.165, "r_y3": 495.55, "coord_origin": "TOPLEFT"}, "text": "GTE", "orig": "GTE", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 98, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.867, "r_y0": 504.102, "r_x1": 153.687, "r_y1": 504.102, "r_x2": 153.687, "r_y2": 495.55, "r_x3": 134.867, "r_y3": 495.55, "coord_origin": "TOPLEFT"}, "text": "FTN", "orig": "FTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 99, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.624, "r_y0": 504.102, "r_x1": 186.942, "r_y1": 504.102, "r_x2": 186.942, "r_y2": 495.55, "r_x3": 183.624, "r_y3": 495.55, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 100, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 227.888, "r_y0": 504.102, "r_x1": 231.205, "r_y1": 504.102, "r_x2": 231.205, "r_y2": 495.55, "r_x3": 227.888, "r_y3": 495.55, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 101, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 259.699, "r_y0": 504.102, "r_x1": 282.114, "r_y1": 504.102, "r_x2": 282.114, "r_y2": 495.55, "r_x3": 259.699, "r_y3": 495.55, "coord_origin": "TOPLEFT"}, "text": "87.14", "orig": "87.14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 102, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 71.789, "r_y0": 516.057, "r_x1": 111.908, "r_y1": 516.057, "r_x2": 111.908, "r_y2": 507.505, "r_x3": 71.789, "r_y3": 507.505, "coord_origin": "TOPLEFT"}, "text": "GTE (FT)", "orig": "GTE (FT)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 103, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.862, "r_y0": 516.057, "r_x1": 153.682, "r_y1": 516.057, "r_x2": 153.682, "r_y2": 507.505, "r_x3": 134.862, "r_y3": 507.505, "coord_origin": "TOPLEFT"}, "text": "FTN", "orig": "FTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 104, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.629, "r_y0": 516.057, "r_x1": 186.947, "r_y1": 516.057, "r_x2": 186.947, "r_y2": 507.505, "r_x3": 183.629, "r_y3": 507.505, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 105, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 227.893, "r_y0": 516.057, "r_x1": 231.211, "r_y1": 516.057, "r_x2": 231.211, "r_y2": 507.505, "r_x3": 227.893, "r_y3": 507.505, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 106, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 259.694, "r_y0": 516.057, "r_x1": 282.109, "r_y1": 516.057, "r_x2": 282.109, "r_y2": 507.505, "r_x3": 259.694, "r_y3": 507.505, "coord_origin": "TOPLEFT"}, "text": "91.02", "orig": "91.02", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 107, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 66.315, "r_y0": 528.012, "r_x1": 117.383, "r_y1": 528.012, "r_x2": 117.383, "r_y2": 519.46, "r_x3": 66.315, "r_y3": 519.46, "coord_origin": "TOPLEFT"}, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 108, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.868, "r_y0": 528.012, "r_x1": 153.687, "r_y1": 528.012, "r_x2": 153.687, "r_y2": 519.46, "r_x3": 134.868, "r_y3": 519.46, "coord_origin": "TOPLEFT"}, "text": "FTN", "orig": "FTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 109, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 176.571, "r_y0": 528.012, "r_x1": 194.006, "r_y1": 528.012, "r_x2": 194.006, "r_y2": 519.46, "r_x3": 176.571, "r_y3": 519.46, "coord_origin": "TOPLEFT"}, "text": "97.5", "orig": "97.5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 110, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 220.835, "r_y0": 528.012, "r_x1": 238.269, "r_y1": 528.012, "r_x2": 238.269, "r_y2": 519.46, "r_x3": 220.835, "r_y3": 519.46, "coord_origin": "TOPLEFT"}, "text": "96.0", "orig": "96.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 111, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 262.189, "r_y0": 528.028, "r_x1": 279.624, "r_y1": 528.028, "r_x2": 279.624, "r_y2": 519.072, "r_x3": 262.189, "r_y3": 519.072, "coord_origin": "TOPLEFT"}, "text": "96.8", "orig": "96.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 112, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 81.612, "r_y0": 545.319, "r_x1": 102.085, "r_y1": 545.319, "r_x2": 102.085, "r_y2": 536.767, "r_x3": 81.612, "r_y3": 536.767, "coord_origin": "TOPLEFT"}, "text": "EDD", "orig": "EDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 113, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 137.911, "r_y0": 545.319, "r_x1": 150.643, "r_y1": 545.319, "r_x2": 150.643, "r_y2": 536.767, "r_x3": 137.911, "r_y3": 536.767, "coord_origin": "TOPLEFT"}, "text": "TB", "orig": "TB", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 114, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 176.566, "r_y0": 545.319, "r_x1": 194.0, "r_y1": 545.319, "r_x2": 194.0, "r_y2": 536.767, "r_x3": 176.566, "r_y3": 536.767, "coord_origin": "TOPLEFT"}, "text": "86.0", "orig": "86.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 115, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 227.893, "r_y0": 545.319, "r_x1": 231.21, "r_y1": 545.319, "r_x2": 231.21, "r_y2": 536.767, "r_x3": 227.893, "r_y3": 536.767, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 116, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 262.184, "r_y0": 545.319, "r_x1": 279.619, "r_y1": 545.319, "r_x2": 279.619, "r_y2": 536.767, "r_x3": 262.184, "r_y3": 536.767, "coord_origin": "TOPLEFT"}, "text": "86.0", "orig": "86.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 117, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 66.315, "r_y0": 557.275, "r_x1": 117.383, "r_y1": 557.275, "r_x2": 117.383, "r_y2": 548.723, "r_x3": 66.315, "r_y3": 548.723, "coord_origin": "TOPLEFT"}, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 118, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 137.906, "r_y0": 557.275, "r_x1": 150.638, "r_y1": 557.275, "r_x2": 150.638, "r_y2": 548.723, "r_x3": 137.906, "r_y3": 548.723, "coord_origin": "TOPLEFT"}, "text": "TB", "orig": "TB", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 119, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 176.571, "r_y0": 557.275, "r_x1": 194.006, "r_y1": 557.275, "r_x2": 194.006, "r_y2": 548.723, "r_x3": 176.571, "r_y3": 548.723, "coord_origin": "TOPLEFT"}, "text": "89.6", "orig": "89.6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 120, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 227.888, "r_y0": 557.275, "r_x1": 231.206, "r_y1": 557.275, "r_x2": 231.206, "r_y2": 548.723, "r_x3": 227.888, "r_y3": 548.723, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 121, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 262.189, "r_y0": 557.2909999999999, "r_x1": 279.624, "r_y1": 557.2909999999999, "r_x2": 279.624, "r_y2": 548.335, "r_x3": 262.189, "r_y3": 548.335, "coord_origin": "TOPLEFT"}, "text": "89.6", "orig": "89.6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 122, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 66.315, "r_y0": 576.823, "r_x1": 117.383, "r_y1": 576.823, "r_x2": 117.383, "r_y2": 568.271, "r_x3": 66.315, "r_y3": 568.271, "coord_origin": "TOPLEFT"}, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 123, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.868, "r_y0": 576.823, "r_x1": 153.687, "r_y1": 576.823, "r_x2": 153.687, "r_y2": 568.271, "r_x3": 134.868, "r_y3": 568.271, "coord_origin": "TOPLEFT"}, "text": "STN", "orig": "STN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 124, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 176.571, "r_y0": 576.823, "r_x1": 194.006, "r_y1": 576.823, "r_x2": 194.006, "r_y2": 568.271, "r_x3": 176.571, "r_y3": 568.271, "coord_origin": "TOPLEFT"}, "text": "96.9", "orig": "96.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 125, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 220.835, "r_y0": 576.823, "r_x1": 238.269, "r_y1": 576.823, "r_x2": 238.269, "r_y2": 568.271, "r_x3": 220.835, "r_y3": 568.271, "coord_origin": "TOPLEFT"}, "text": "95.7", "orig": "95.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 126, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 262.19, "r_y0": 576.823, "r_x1": 279.624, "r_y1": 576.823, "r_x2": 279.624, "r_y2": 568.271, "r_x3": 262.19, "r_y3": 568.271, "coord_origin": "TOPLEFT"}, "text": "96.7", "orig": "96.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": [{"id": 27, "label": "text", "bbox": {"l": 78.843, "t": 420.959, "r": 104.855, "b": 429.511, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 71, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 78.843, "r_y0": 429.511, "r_x1": 104.855, "r_y1": 429.511, "r_x2": 104.855, "r_y2": 420.959, "r_x3": 78.843, "r_y3": 420.959, "coord_origin": "TOPLEFT"}, "text": "Model", "orig": "Model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 28, "label": "text", "bbox": {"l": 211.2, "t": 414.981, "r": 236.107, "b": 423.533, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 72, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 211.2, "r_y0": 423.533, "r_x1": 236.107, "r_y1": 423.533, "r_x2": 236.107, "r_y2": 414.981, "r_x3": 211.2, "r_y3": 414.981, "coord_origin": "TOPLEFT"}, "text": "TEDS", "orig": "TEDS", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 29, "label": "text", "bbox": {"l": 129.338, "t": 426.936, "r": 159.216, "b": 435.488, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 73, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 129.338, "r_y0": 435.488, "r_x1": 159.216, "r_y1": 435.488, "r_x2": 159.216, "r_y2": 426.936, "r_x3": 129.338, "r_y3": 426.936, "coord_origin": "TOPLEFT"}, "text": "Dataset", "orig": "Dataset", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 30, "label": "text", "bbox": {"l": 171.171, "t": 426.936, "r": 199.405, "b": 435.488, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 74, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 171.171, "r_y0": 435.488, "r_x1": 199.405, "r_y1": 435.488, "r_x2": 199.405, "r_y2": 426.936, "r_x3": 171.171, "r_y3": 426.936, "coord_origin": "TOPLEFT"}, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 31, "label": "text", "bbox": {"l": 211.36, "t": 426.936, "r": 247.744, "b": 435.488, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 75, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 211.36, "r_y0": 435.488, "r_x1": 247.744, "r_y1": 435.488, "r_x2": 247.744, "r_y2": 426.936, "r_x3": 211.36, "r_y3": 426.936, "coord_origin": "TOPLEFT"}, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 32, "label": "text", "bbox": {"l": 264.54, "t": 426.936, "r": 277.273, "b": 435.488, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 76, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 264.54, "r_y0": 435.488, "r_x1": 277.273, "r_y1": 435.488, "r_x2": 277.273, "r_y2": 426.936, "r_x3": 264.54, "r_y3": 426.936, "coord_origin": "TOPLEFT"}, "text": "All", "orig": "All", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 33, "label": "text", "bbox": {"l": 81.612, "t": 443.893, "r": 102.085, "b": 452.445, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 77, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 81.612, "r_y0": 452.445, "r_x1": 102.085, "r_y1": 452.445, "r_x2": 102.085, "r_y2": 443.893, "r_x3": 81.612, "r_y3": 443.893, "coord_origin": "TOPLEFT"}, "text": "EDD", "orig": "EDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 34, "label": "text", "bbox": {"l": 134.872, "t": 443.893, "r": 153.691, "b": 452.445, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 78, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.872, "r_y0": 452.445, "r_x1": 153.691, "r_y1": 452.445, "r_x2": 153.691, "r_y2": 443.893, "r_x3": 134.872, "r_y3": 443.893, "coord_origin": "TOPLEFT"}, "text": "PTN", "orig": "PTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 35, "label": "text", "bbox": {"l": 176.566, "t": 443.893, "r": 194.0, "b": 452.445, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 79, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 176.566, "r_y0": 452.445, "r_x1": 194.0, "r_y1": 452.445, "r_x2": 194.0, "r_y2": 443.893, "r_x3": 176.566, "r_y3": 443.893, "coord_origin": "TOPLEFT"}, "text": "91.1", "orig": "91.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 36, "label": "text", "bbox": {"l": 220.829, "t": 443.893, "r": 238.264, "b": 452.445, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 80, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 220.829, "r_y0": 452.445, "r_x1": 238.264, "r_y1": 452.445, "r_x2": 238.264, "r_y2": 443.893, "r_x3": 220.829, "r_y3": 443.893, "coord_origin": "TOPLEFT"}, "text": "88.7", "orig": "88.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 37, "label": "text", "bbox": {"l": 262.184, "t": 443.893, "r": 279.619, "b": 452.445, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 81, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 262.184, "r_y0": 452.445, "r_x1": 279.619, "r_y1": 452.445, "r_x2": 279.619, "r_y2": 443.893, "r_x3": 262.184, "r_y3": 443.893, "coord_origin": "TOPLEFT"}, "text": "89.9", "orig": "89.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 38, "label": "text", "bbox": {"l": 82.165, "t": 455.849, "r": 101.532, "b": 464.401, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 82, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 82.165, "r_y0": 464.401, "r_x1": 101.532, "r_y1": 464.401, "r_x2": 101.532, "r_y2": 455.849, "r_x3": 82.165, "r_y3": 455.849, "coord_origin": "TOPLEFT"}, "text": "GTE", "orig": "GTE", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 39, "label": "text", "bbox": {"l": 134.867, "t": 455.849, "r": 153.687, "b": 464.401, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 83, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.867, "r_y0": 464.401, "r_x1": 153.687, "r_y1": 464.401, "r_x2": 153.687, "r_y2": 455.849, "r_x3": 134.867, "r_y3": 455.849, "coord_origin": "TOPLEFT"}, "text": "PTN", "orig": "PTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 40, "label": "text", "bbox": {"l": 183.624, "t": 455.849, "r": 186.942, "b": 464.401, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 84, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.624, "r_y0": 464.401, "r_x1": 186.942, "r_y1": 464.401, "r_x2": 186.942, "r_y2": 455.849, "r_x3": 183.624, "r_y3": 455.849, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 41, "label": "text", "bbox": {"l": 227.888, "t": 455.849, "r": 231.205, "b": 464.401, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 85, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 227.888, "r_y0": 464.401, "r_x1": 231.205, "r_y1": 464.401, "r_x2": 231.205, "r_y2": 455.849, "r_x3": 227.888, "r_y3": 455.849, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 42, "label": "text", "bbox": {"l": 259.699, "t": 455.849, "r": 282.114, "b": 464.401, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 86, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 259.699, "r_y0": 464.401, "r_x1": 282.114, "r_y1": 464.401, "r_x2": 282.114, "r_y2": 455.849, "r_x3": 259.699, "r_y3": 455.849, "coord_origin": "TOPLEFT"}, "text": "93.01", "orig": "93.01", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 43, "label": "text", "bbox": {"l": 66.315, "t": 468.402, "r": 117.383, "b": 476.954, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 87, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 66.315, "r_y0": 476.954, "r_x1": 117.383, "r_y1": 476.954, "r_x2": 117.383, "r_y2": 468.402, "r_x3": 66.315, "r_y3": 468.402, "coord_origin": "TOPLEFT"}, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 44, "label": "text", "bbox": {"l": 134.868, "t": 468.402, "r": 153.687, "b": 476.954, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 88, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.868, "r_y0": 476.954, "r_x1": 153.687, "r_y1": 476.954, "r_x2": 153.687, "r_y2": 468.402, "r_x3": 134.868, "r_y3": 468.402, "coord_origin": "TOPLEFT"}, "text": "PTN", "orig": "PTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 45, "label": "text", "bbox": {"l": 176.571, "t": 468.402, "r": 194.006, "b": 476.954, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 89, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 176.571, "r_y0": 476.954, "r_x1": 194.006, "r_y1": 476.954, "r_x2": 194.006, "r_y2": 468.402, "r_x3": 176.571, "r_y3": 468.402, "coord_origin": "TOPLEFT"}, "text": "98.5", "orig": "98.5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 46, "label": "text", "bbox": {"l": 220.835, "t": 468.402, "r": 238.269, "b": 476.954, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 90, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 220.835, "r_y0": 476.954, "r_x1": 238.269, "r_y1": 476.954, "r_x2": 238.269, "r_y2": 468.402, "r_x3": 220.835, "r_y3": 468.402, "coord_origin": "TOPLEFT"}, "text": "95.0", "orig": "95.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 47, "label": "text", "bbox": {"l": 259.698, "t": 468.014, "r": 282.114, "b": 476.97, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 91, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 259.698, "r_y0": 476.97, "r_x1": 282.114, "r_y1": 476.97, "r_x2": 282.114, "r_y2": 468.014, "r_x3": 259.698, "r_y3": 468.014, "coord_origin": "TOPLEFT"}, "text": "96.75", "orig": "96.75", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 48, "label": "text", "bbox": {"l": 81.612, "t": 483.595, "r": 102.085, "b": 492.147, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 92, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 81.612, "r_y0": 492.147, "r_x1": 102.085, "r_y1": 492.147, "r_x2": 102.085, "r_y2": 483.595, "r_x3": 81.612, "r_y3": 483.595, "coord_origin": "TOPLEFT"}, "text": "EDD", "orig": "EDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 49, "label": "text", "bbox": {"l": 134.872, "t": 483.595, "r": 153.691, "b": 492.147, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 93, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.872, "r_y0": 492.147, "r_x1": 153.691, "r_y1": 492.147, "r_x2": 153.691, "r_y2": 483.595, "r_x3": 134.872, "r_y3": 483.595, "coord_origin": "TOPLEFT"}, "text": "FTN", "orig": "FTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 50, "label": "text", "bbox": {"l": 176.566, "t": 483.595, "r": 194.0, "b": 492.147, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 94, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 176.566, "r_y0": 492.147, "r_x1": 194.0, "r_y1": 492.147, "r_x2": 194.0, "r_y2": 483.595, "r_x3": 176.566, "r_y3": 483.595, "coord_origin": "TOPLEFT"}, "text": "88.4", "orig": "88.4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 51, "label": "text", "bbox": {"l": 218.339, "t": 483.595, "r": 240.755, "b": 492.147, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 95, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 218.339, "r_y0": 492.147, "r_x1": 240.755, "r_y1": 492.147, "r_x2": 240.755, "r_y2": 483.595, "r_x3": 218.339, "r_y3": 483.595, "coord_origin": "TOPLEFT"}, "text": "92.08", "orig": "92.08", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 52, "label": "text", "bbox": {"l": 262.184, "t": 483.595, "r": 279.619, "b": 492.147, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 96, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 262.184, "r_y0": 492.147, "r_x1": 279.619, "r_y1": 492.147, "r_x2": 279.619, "r_y2": 483.595, "r_x3": 262.184, "r_y3": 483.595, "coord_origin": "TOPLEFT"}, "text": "90.6", "orig": "90.6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 53, "label": "text", "bbox": {"l": 82.165, "t": 495.55, "r": 101.532, "b": 504.102, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 97, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 82.165, "r_y0": 504.102, "r_x1": 101.532, "r_y1": 504.102, "r_x2": 101.532, "r_y2": 495.55, "r_x3": 82.165, "r_y3": 495.55, "coord_origin": "TOPLEFT"}, "text": "GTE", "orig": "GTE", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 54, "label": "text", "bbox": {"l": 134.867, "t": 495.55, "r": 153.687, "b": 504.102, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 98, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.867, "r_y0": 504.102, "r_x1": 153.687, "r_y1": 504.102, "r_x2": 153.687, "r_y2": 495.55, "r_x3": 134.867, "r_y3": 495.55, "coord_origin": "TOPLEFT"}, "text": "FTN", "orig": "FTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 55, "label": "text", "bbox": {"l": 183.624, "t": 495.55, "r": 186.942, "b": 504.102, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 99, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.624, "r_y0": 504.102, "r_x1": 186.942, "r_y1": 504.102, "r_x2": 186.942, "r_y2": 495.55, "r_x3": 183.624, "r_y3": 495.55, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 56, "label": "text", "bbox": {"l": 227.888, "t": 495.55, "r": 231.205, "b": 504.102, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 100, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 227.888, "r_y0": 504.102, "r_x1": 231.205, "r_y1": 504.102, "r_x2": 231.205, "r_y2": 495.55, "r_x3": 227.888, "r_y3": 495.55, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 57, "label": "text", "bbox": {"l": 259.699, "t": 495.55, "r": 282.114, "b": 504.102, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 101, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 259.699, "r_y0": 504.102, "r_x1": 282.114, "r_y1": 504.102, "r_x2": 282.114, "r_y2": 495.55, "r_x3": 259.699, "r_y3": 495.55, "coord_origin": "TOPLEFT"}, "text": "87.14", "orig": "87.14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 58, "label": "text", "bbox": {"l": 71.789, "t": 507.505, "r": 111.908, "b": 516.057, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 102, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 71.789, "r_y0": 516.057, "r_x1": 111.908, "r_y1": 516.057, "r_x2": 111.908, "r_y2": 507.505, "r_x3": 71.789, "r_y3": 507.505, "coord_origin": "TOPLEFT"}, "text": "GTE (FT)", "orig": "GTE (FT)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 59, "label": "text", "bbox": {"l": 134.862, "t": 507.505, "r": 153.682, "b": 516.057, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 103, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.862, "r_y0": 516.057, "r_x1": 153.682, "r_y1": 516.057, "r_x2": 153.682, "r_y2": 507.505, "r_x3": 134.862, "r_y3": 507.505, "coord_origin": "TOPLEFT"}, "text": "FTN", "orig": "FTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 60, "label": "text", "bbox": {"l": 183.629, "t": 507.505, "r": 186.947, "b": 516.057, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 104, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.629, "r_y0": 516.057, "r_x1": 186.947, "r_y1": 516.057, "r_x2": 186.947, "r_y2": 507.505, "r_x3": 183.629, "r_y3": 507.505, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 61, "label": "text", "bbox": {"l": 227.893, "t": 507.505, "r": 231.211, "b": 516.057, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 105, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 227.893, "r_y0": 516.057, "r_x1": 231.211, "r_y1": 516.057, "r_x2": 231.211, "r_y2": 507.505, "r_x3": 227.893, "r_y3": 507.505, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 62, "label": "text", "bbox": {"l": 259.694, "t": 507.505, "r": 282.109, "b": 516.057, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 106, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 259.694, "r_y0": 516.057, "r_x1": 282.109, "r_y1": 516.057, "r_x2": 282.109, "r_y2": 507.505, "r_x3": 259.694, "r_y3": 507.505, "coord_origin": "TOPLEFT"}, "text": "91.02", "orig": "91.02", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 63, "label": "text", "bbox": {"l": 66.315, "t": 519.46, "r": 117.383, "b": 528.012, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 107, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 66.315, "r_y0": 528.012, "r_x1": 117.383, "r_y1": 528.012, "r_x2": 117.383, "r_y2": 519.46, "r_x3": 66.315, "r_y3": 519.46, "coord_origin": "TOPLEFT"}, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 64, "label": "text", "bbox": {"l": 134.868, "t": 519.46, "r": 153.687, "b": 528.012, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 108, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.868, "r_y0": 528.012, "r_x1": 153.687, "r_y1": 528.012, "r_x2": 153.687, "r_y2": 519.46, "r_x3": 134.868, "r_y3": 519.46, "coord_origin": "TOPLEFT"}, "text": "FTN", "orig": "FTN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 65, "label": "text", "bbox": {"l": 176.571, "t": 519.46, "r": 194.006, "b": 528.012, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 109, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 176.571, "r_y0": 528.012, "r_x1": 194.006, "r_y1": 528.012, "r_x2": 194.006, "r_y2": 519.46, "r_x3": 176.571, "r_y3": 519.46, "coord_origin": "TOPLEFT"}, "text": "97.5", "orig": "97.5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 66, "label": "text", "bbox": {"l": 220.835, "t": 519.46, "r": 238.269, "b": 528.012, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 110, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 220.835, "r_y0": 528.012, "r_x1": 238.269, "r_y1": 528.012, "r_x2": 238.269, "r_y2": 519.46, "r_x3": 220.835, "r_y3": 519.46, "coord_origin": "TOPLEFT"}, "text": "96.0", "orig": "96.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 67, "label": "text", "bbox": {"l": 262.189, "t": 519.072, "r": 279.624, "b": 528.028, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 111, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 262.189, "r_y0": 528.028, "r_x1": 279.624, "r_y1": 528.028, "r_x2": 279.624, "r_y2": 519.072, "r_x3": 262.189, "r_y3": 519.072, "coord_origin": "TOPLEFT"}, "text": "96.8", "orig": "96.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 68, "label": "text", "bbox": {"l": 81.612, "t": 536.767, "r": 102.085, "b": 545.319, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 112, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 81.612, "r_y0": 545.319, "r_x1": 102.085, "r_y1": 545.319, "r_x2": 102.085, "r_y2": 536.767, "r_x3": 81.612, "r_y3": 536.767, "coord_origin": "TOPLEFT"}, "text": "EDD", "orig": "EDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 69, "label": "text", "bbox": {"l": 137.911, "t": 536.767, "r": 150.643, "b": 545.319, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 113, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 137.911, "r_y0": 545.319, "r_x1": 150.643, "r_y1": 545.319, "r_x2": 150.643, "r_y2": 536.767, "r_x3": 137.911, "r_y3": 536.767, "coord_origin": "TOPLEFT"}, "text": "TB", "orig": "TB", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 70, "label": "text", "bbox": {"l": 176.566, "t": 536.767, "r": 194.0, "b": 545.319, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 114, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 176.566, "r_y0": 545.319, "r_x1": 194.0, "r_y1": 545.319, "r_x2": 194.0, "r_y2": 536.767, "r_x3": 176.566, "r_y3": 536.767, "coord_origin": "TOPLEFT"}, "text": "86.0", "orig": "86.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 71, "label": "text", "bbox": {"l": 227.893, "t": 536.767, "r": 231.21, "b": 545.319, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 115, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 227.893, "r_y0": 545.319, "r_x1": 231.21, "r_y1": 545.319, "r_x2": 231.21, "r_y2": 536.767, "r_x3": 227.893, "r_y3": 536.767, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 72, "label": "text", "bbox": {"l": 262.184, "t": 536.767, "r": 279.619, "b": 545.319, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 116, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 262.184, "r_y0": 545.319, "r_x1": 279.619, "r_y1": 545.319, "r_x2": 279.619, "r_y2": 536.767, "r_x3": 262.184, "r_y3": 536.767, "coord_origin": "TOPLEFT"}, "text": "86.0", "orig": "86.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 73, "label": "text", "bbox": {"l": 66.315, "t": 548.723, "r": 117.383, "b": 557.275, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 117, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 66.315, "r_y0": 557.275, "r_x1": 117.383, "r_y1": 557.275, "r_x2": 117.383, "r_y2": 548.723, "r_x3": 66.315, "r_y3": 548.723, "coord_origin": "TOPLEFT"}, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 74, "label": "text", "bbox": {"l": 137.906, "t": 548.723, "r": 150.638, "b": 557.275, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 118, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 137.906, "r_y0": 557.275, "r_x1": 150.638, "r_y1": 557.275, "r_x2": 150.638, "r_y2": 548.723, "r_x3": 137.906, "r_y3": 548.723, "coord_origin": "TOPLEFT"}, "text": "TB", "orig": "TB", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 75, "label": "text", "bbox": {"l": 176.571, "t": 548.723, "r": 194.006, "b": 557.275, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 119, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 176.571, "r_y0": 557.275, "r_x1": 194.006, "r_y1": 557.275, "r_x2": 194.006, "r_y2": 548.723, "r_x3": 176.571, "r_y3": 548.723, "coord_origin": "TOPLEFT"}, "text": "89.6", "orig": "89.6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 76, "label": "text", "bbox": {"l": 227.888, "t": 548.723, "r": 231.206, "b": 557.275, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 120, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 227.888, "r_y0": 557.275, "r_x1": 231.206, "r_y1": 557.275, "r_x2": 231.206, "r_y2": 548.723, "r_x3": 227.888, "r_y3": 548.723, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 77, "label": "text", "bbox": {"l": 262.189, "t": 548.335, "r": 279.624, "b": 557.2909999999999, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 121, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 262.189, "r_y0": 557.2909999999999, "r_x1": 279.624, "r_y1": 557.2909999999999, "r_x2": 279.624, "r_y2": 548.335, "r_x3": 262.189, "r_y3": 548.335, "coord_origin": "TOPLEFT"}, "text": "89.6", "orig": "89.6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 78, "label": "text", "bbox": {"l": 66.315, "t": 568.271, "r": 117.383, "b": 576.823, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 122, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 66.315, "r_y0": 576.823, "r_x1": 117.383, "r_y1": 576.823, "r_x2": 117.383, "r_y2": 568.271, "r_x3": 66.315, "r_y3": 568.271, "coord_origin": "TOPLEFT"}, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 79, "label": "text", "bbox": {"l": 134.868, "t": 568.271, "r": 153.687, "b": 576.823, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 123, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 134.868, "r_y0": 576.823, "r_x1": 153.687, "r_y1": 576.823, "r_x2": 153.687, "r_y2": 568.271, "r_x3": 134.868, "r_y3": 568.271, "coord_origin": "TOPLEFT"}, "text": "STN", "orig": "STN", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 80, "label": "text", "bbox": {"l": 176.571, "t": 568.271, "r": 194.006, "b": 576.823, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 124, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 176.571, "r_y0": 576.823, "r_x1": 194.006, "r_y1": 576.823, "r_x2": 194.006, "r_y2": 568.271, "r_x3": 176.571, "r_y3": 568.271, "coord_origin": "TOPLEFT"}, "text": "96.9", "orig": "96.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 81, "label": "text", "bbox": {"l": 220.835, "t": 568.271, "r": 238.269, "b": 576.823, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 125, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 220.835, "r_y0": 576.823, "r_x1": 238.269, "r_y1": 576.823, "r_x2": 238.269, "r_y2": 568.271, "r_x3": 220.835, "r_y3": 568.271, "coord_origin": "TOPLEFT"}, "text": "95.7", "orig": "95.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 82, "label": "text", "bbox": {"l": 262.19, "t": 568.271, "r": 279.624, "b": 576.823, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 126, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 262.19, "r_y0": 576.823, "r_x1": 279.624, "r_y1": 576.823, "r_x2": 279.624, "r_y2": 568.271, "r_x3": 262.19, "r_y3": 568.271, "coord_origin": "TOPLEFT"}, "text": "96.7", "orig": "96.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}]}, "text": null, "otsl_seq": ["ched", "ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 11, "num_cols": 5, "table_cells": [{"bbox": {"l": 78.843, "t": 420.959, "r": 104.855, "b": 429.511, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Model", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 211.2, "t": 414.981, "r": 247.744, "b": 435.488, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "TEDS Complex", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 129.338, "t": 426.936, "r": 159.216, "b": 435.488, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "Dataset", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 171.171, "t": 426.936, "r": 199.405, "b": 435.488, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "Simple", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 264.54, "t": 426.936, "r": 277.273, "b": 435.488, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "All", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 81.612, "t": 443.893, "r": 102.085, "b": 452.445, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "EDD", "column_header": false, "row_header": true, "row_section": false}, {"bbox": {"l": 134.872, "t": 443.893, "r": 153.691, "b": 452.445, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "PTN", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 176.566, "t": 443.893, "r": 194.0, "b": 452.445, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "91.1", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 220.829, "t": 443.893, "r": 238.264, "b": 452.445, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "88.7", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 262.184, "t": 443.893, "r": 279.619, "b": 452.445, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "89.9", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 82.165, "t": 455.849, "r": 101.532, "b": 464.401, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "GTE", "column_header": false, "row_header": true, "row_section": false}, {"bbox": {"l": 134.867, "t": 455.849, "r": 153.687, "b": 464.401, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "PTN", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 183.624, "t": 455.849, "r": 186.942, "b": 464.401, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "-", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 227.888, "t": 455.849, "r": 231.205, "b": 464.401, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "-", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 259.699, "t": 455.849, "r": 282.114, "b": 464.401, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "93.01", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 66.315, "t": 468.402, "r": 117.383, "b": 476.954, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "TableFormer", "column_header": false, "row_header": true, "row_section": false}, {"bbox": {"l": 134.868, "t": 468.402, "r": 153.687, "b": 476.954, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "PTN", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 176.571, "t": 468.402, "r": 194.006, "b": 476.954, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "98.5", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 220.835, "t": 468.402, "r": 238.269, "b": 476.954, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "95.0", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 259.698, "t": 468.014, "r": 282.114, "b": 476.97, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "96.75", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 81.612, "t": 483.595, "r": 102.085, "b": 492.147, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "EDD", "column_header": false, "row_header": true, "row_section": false}, {"bbox": {"l": 134.872, "t": 483.595, "r": 153.691, "b": 492.147, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "FTN", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 176.566, "t": 483.595, "r": 194.0, "b": 492.147, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "88.4", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 218.339, "t": 483.595, "r": 240.755, "b": 492.147, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "92.08", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 262.184, "t": 483.595, "r": 279.619, "b": 492.147, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "90.6", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 82.165, "t": 495.55, "r": 101.532, "b": 504.102, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "GTE", "column_header": false, "row_header": true, "row_section": false}, {"bbox": {"l": 134.867, "t": 495.55, "r": 153.687, "b": 504.102, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "FTN", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 183.624, "t": 495.55, "r": 186.942, "b": 504.102, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "-", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 227.888, "t": 495.55, "r": 231.205, "b": 504.102, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "-", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 259.699, "t": 495.55, "r": 282.114, "b": 504.102, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "87.14", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 71.789, "t": 507.505, "r": 111.908, "b": 516.057, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "GTE (FT)", "column_header": false, "row_header": true, "row_section": false}, {"bbox": {"l": 134.862, "t": 507.505, "r": 153.682, "b": 516.057, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "FTN", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 183.629, "t": 507.505, "r": 186.947, "b": 516.057, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "-", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 227.893, "t": 507.505, "r": 231.211, "b": 516.057, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "-", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 259.694, "t": 507.505, "r": 282.109, "b": 516.057, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "91.02", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 66.315, "t": 519.46, "r": 117.383, "b": 528.012, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 7, "end_row_offset_idx": 8, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "TableFormer", "column_header": false, "row_header": true, "row_section": false}, {"bbox": {"l": 134.868, "t": 519.46, "r": 153.687, "b": 528.012, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 7, "end_row_offset_idx": 8, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "FTN", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 176.571, "t": 519.46, "r": 194.006, "b": 528.012, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 7, "end_row_offset_idx": 8, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "97.5", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 220.835, "t": 519.46, "r": 238.269, "b": 528.012, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 7, "end_row_offset_idx": 8, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "96.0", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 262.189, "t": 519.072, "r": 279.624, "b": 528.028, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 7, "end_row_offset_idx": 8, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "96.8", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 81.612, "t": 536.767, "r": 102.085, "b": 545.319, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 8, "end_row_offset_idx": 9, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "EDD", "column_header": false, "row_header": true, "row_section": false}, {"bbox": {"l": 137.911, "t": 536.767, "r": 150.643, "b": 545.319, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 8, "end_row_offset_idx": 9, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "TB", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 176.566, "t": 536.767, "r": 194.0, "b": 545.319, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 8, "end_row_offset_idx": 9, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "86.0", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 227.893, "t": 536.767, "r": 231.21, "b": 545.319, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 8, "end_row_offset_idx": 9, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "-", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 262.184, "t": 536.767, "r": 279.619, "b": 545.319, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 8, "end_row_offset_idx": 9, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "86.0", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 66.315, "t": 548.723, "r": 117.383, "b": 557.275, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 9, "end_row_offset_idx": 10, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "TableFormer", "column_header": false, "row_header": true, "row_section": false}, {"bbox": {"l": 137.906, "t": 548.723, "r": 150.638, "b": 557.275, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 9, "end_row_offset_idx": 10, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "TB", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 176.571, "t": 548.723, "r": 194.006, "b": 557.275, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 9, "end_row_offset_idx": 10, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "89.6", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 227.888, "t": 548.723, "r": 231.206, "b": 557.275, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 9, "end_row_offset_idx": 10, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "-", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 262.189, "t": 548.335, "r": 279.624, "b": 557.2909999999999, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 9, "end_row_offset_idx": 10, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "89.6", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 66.315, "t": 568.271, "r": 117.383, "b": 576.823, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 10, "end_row_offset_idx": 11, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "TableFormer", "column_header": false, "row_header": true, "row_section": false}, {"bbox": {"l": 134.868, "t": 568.271, "r": 153.687, "b": 576.823, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 10, "end_row_offset_idx": 11, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "STN", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 176.571, "t": 568.271, "r": 194.006, "b": 576.823, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 10, "end_row_offset_idx": 11, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "96.9", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 220.835, "t": 568.271, "r": 238.269, "b": 576.823, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 10, "end_row_offset_idx": 11, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "95.7", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 262.19, "t": 568.271, "r": 279.624, "b": 576.823, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 10, "end_row_offset_idx": 11, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "96.7", "column_header": false, "row_header": false, "row_section": false}]}, {"label": "text", "id": 15, "page_no": 6, "cluster": {"id": 15, "label": "text", "bbox": {"l": 50.112, "t": 592.702, "r": 286.365, "b": 613.2090000000001, "coord_origin": "TOPLEFT"}, "confidence": 0.7209173440933228, "cells": [{"index": 127, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 601.254, "r_x1": 82.062, "r_y1": 601.254, "r_x2": 82.062, "r_y2": 592.702, "r_x3": 50.112, "r_y3": 592.702, "coord_origin": "TOPLEFT"}, "text": "Table 2:", "orig": "Table 2:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 128, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 87.382, "r_y0": 601.254, "r_x1": 286.365, "r_y1": 601.254, "r_x2": 286.365, "r_y2": 592.702, "r_x3": 87.382, "r_y3": 592.702, "coord_origin": "TOPLEFT"}, "text": "Structure results on PubTabNet (PTN), FinTabNet", "orig": "Structure results on PubTabNet (PTN), FinTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 129, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 613.2090000000001, "r_x1": 247.461, "r_y1": 613.2090000000001, "r_x2": 247.461, "r_y2": 604.657, "r_x3": 50.112, "r_y3": 604.657, "coord_origin": "TOPLEFT"}, "text": "(FTN), TableBank (TB) and SynthTabNet (STN).", "orig": "(FTN), TableBank (TB) and SynthTabNet (STN).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Table 2: Structure results on PubTabNet (PTN), FinTabNet (FTN), TableBank (TB) and SynthTabNet (STN)."}, {"label": "text", "id": 16, "page_no": 6, "cluster": {"id": 16, "label": "text", "bbox": {"l": 50.112, "t": 616.612, "r": 261.787, "b": 625.164, "coord_origin": "TOPLEFT"}, "confidence": 0.6433312892913818, "cells": [{"index": 130, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 625.164, "r_x1": 261.787, "r_y1": 625.164, "r_x2": 261.787, "r_y2": 616.612, "r_x3": 50.112, "r_y3": 616.612, "coord_origin": "TOPLEFT"}, "text": "FT: Model was trained on PubTabNet then finetuned.", "orig": "FT: Model was trained on PubTabNet then finetuned.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "FT: Model was trained on PubTabNet then finetuned."}, {"label": "text", "id": 3, "page_no": 6, "cluster": {"id": 3, "label": "text", "bbox": {"l": 50.112, "t": 644.35, "r": 286.366, "b": 713.066, "coord_origin": "TOPLEFT"}, "confidence": 0.9854635000228882, "cells": [{"index": 131, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 653.306, "r_x1": 124.722, "r_y1": 653.306, "r_x2": 124.722, "r_y2": 644.35, "r_x3": 62.067, "r_y3": 644.35, "coord_origin": "TOPLEFT"}, "text": "Cell Detection.", "orig": "Cell Detection.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 132, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 128.204, "r_y0": 653.29, "r_x1": 242.933, "r_y1": 653.29, "r_x2": 242.933, "r_y2": 644.738, "r_x3": 128.204, "r_y3": 644.738, "coord_origin": "TOPLEFT"}, "text": "Like any object detector, our", "orig": "Like any object detector, our", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 133, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 245.554, "r_y0": 653.1469999999999, "r_x1": 286.361, "r_y1": 653.1469999999999, "r_x2": 286.361, "r_y2": 644.559, "r_x3": 245.554, "r_y3": 644.559, "coord_origin": "TOPLEFT"}, "text": "Cell BBox", "orig": "Cell BBox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 134, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 665.102, "r_x1": 84.971, "r_y1": 665.102, "r_x2": 84.971, "r_y2": 656.514, "r_x3": 50.112, "r_y3": 656.514, "coord_origin": "TOPLEFT"}, "text": "Detector", "orig": "Detector", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 135, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 89.515, "r_y0": 665.245, "r_x1": 123.677, "r_y1": 665.245, "r_x2": 123.677, "r_y2": 656.693, "r_x3": 89.515, "r_y3": 656.693, "coord_origin": "TOPLEFT"}, "text": "provides", "orig": "provides", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 136, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 127.991, "r_y0": 665.245, "r_x1": 286.366, "r_y1": 665.245, "r_x2": 286.366, "r_y2": 656.693, "r_x3": 127.991, "r_y3": 656.693, "coord_origin": "TOPLEFT"}, "text": "bounding boxes that can be improved", "orig": "bounding boxes that can be improved", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 137, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 677.2, "r_x1": 286.365, "r_y1": 677.2, "r_x2": 286.365, "r_y2": 668.648, "r_x3": 50.112, "r_y3": 668.648, "coord_origin": "TOPLEFT"}, "text": "with post-processing during inference. We make use of the", "orig": "with post-processing during inference. We make use of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 138, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 689.156, "r_x1": 259.655, "r_y1": 689.156, "r_x2": 259.655, "r_y2": 680.604, "r_x3": 50.112, "r_y3": 680.604, "coord_origin": "TOPLEFT"}, "text": "grid-like structure of tables to refine the predictions.", "orig": "grid-like structure of tables to refine the predictions.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 139, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 263.65, "r_y0": 689.156, "r_x1": 286.365, "r_y1": 689.156, "r_x2": 286.365, "r_y2": 680.604, "r_x3": 263.65, "r_y3": 680.604, "coord_origin": "TOPLEFT"}, "text": "A de-", "orig": "A de-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 140, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 701.111, "r_x1": 286.365, "r_y1": 701.111, "r_x2": 286.365, "r_y2": 692.559, "r_x3": 50.112, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "tailed explanation on the post-processing is available in the", "orig": "tailed explanation on the post-processing is available in the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 141, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 713.066, "r_x1": 147.068, "r_y1": 713.066, "r_x2": 147.068, "r_y2": 704.514, "r_x3": 50.112, "r_y3": 704.514, "coord_origin": "TOPLEFT"}, "text": "supplementary material.", "orig": "supplementary material.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 142, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 152.159, "r_y0": 713.066, "r_x1": 223.003, "r_y1": 713.066, "r_x2": 223.003, "r_y2": 704.514, "r_x3": 152.159, "r_y3": 704.514, "coord_origin": "TOPLEFT"}, "text": "As shown in Tab.", "orig": "As shown in Tab.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 143, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 228.094, "r_y0": 713.066, "r_x1": 286.365, "r_y1": 713.066, "r_x2": 286.365, "r_y2": 704.514, "r_x3": 228.094, "r_y3": 704.514, "coord_origin": "TOPLEFT"}, "text": "3, we evaluate", "orig": "3, we evaluate", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Cell Detection. Like any object detector, our Cell BBox Detector provides bounding boxes that can be improved with post-processing during inference. We make use of the grid-like structure of tables to refine the predictions. A detailed explanation on the post-processing is available in the supplementary material. As shown in Tab. 3, we evaluate"}, {"label": "text", "id": 7, "page_no": 6, "cluster": {"id": 7, "label": "text", "bbox": {"l": 308.862, "t": 75.298, "r": 545.115, "b": 227.49099999999999, "coord_origin": "TOPLEFT"}, "confidence": 0.9713197946548462, "cells": [{"index": 144, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 84.029, "r_x1": 322.142, "r_y1": 84.029, "r_x2": 322.142, "r_y2": 75.47699999999998, "r_x3": 308.862, "r_y3": 75.47699999999998, "coord_origin": "TOPLEFT"}, "text": "our", "orig": "our", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 145, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 325.454, "r_y0": 83.88599999999997, "r_x1": 404.567, "r_y1": 83.88599999999997, "r_x2": 404.567, "r_y2": 75.298, "r_x3": 325.454, "r_y3": 75.298, "coord_origin": "TOPLEFT"}, "text": "Cell BBox Decoder", "orig": "Cell BBox Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 146, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 408.104, "r_y0": 84.029, "r_x1": 545.11, "r_y1": 84.029, "r_x2": 545.11, "r_y2": 75.47699999999998, "r_x3": 408.104, "r_y3": 75.47699999999998, "coord_origin": "TOPLEFT"}, "text": "accuracy for cells with a class la-", "orig": "accuracy for cells with a class la-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 147, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 95.98400000000004, "r_x1": 545.115, "r_y1": 95.98400000000004, "r_x2": 545.115, "r_y2": 87.43200000000002, "r_x3": 308.862, "r_y3": 87.43200000000002, "coord_origin": "TOPLEFT"}, "text": "bel of 'content' only using the PASCAL VOC mAP metric", "orig": "bel of 'content' only using the PASCAL VOC mAP metric", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 148, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 107.93899999999996, "r_x1": 320.478, "r_y1": 107.93899999999996, "r_x2": 320.478, "r_y2": 99.38699999999994, "r_x3": 308.862, "r_y3": 99.38699999999994, "coord_origin": "TOPLEFT"}, "text": "for", "orig": "for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 149, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 324.374, "r_y0": 107.93899999999996, "r_x1": 470.226, "r_y1": 107.93899999999996, "r_x2": 470.226, "r_y2": 99.38699999999994, "r_x3": 324.374, "r_y3": 99.38699999999994, "coord_origin": "TOPLEFT"}, "text": "pre-processing and post-processing.", "orig": "pre-processing and post-processing.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 150, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 477.529, "r_y0": 107.93899999999996, "r_x1": 545.115, "r_y1": 107.93899999999996, "r_x2": 545.115, "r_y2": 99.38699999999994, "r_x3": 477.529, "r_y3": 99.38699999999994, "coord_origin": "TOPLEFT"}, "text": "Note that we do", "orig": "Note that we do", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 151, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 119.894, "r_x1": 545.115, "r_y1": 119.894, "r_x2": 545.115, "r_y2": 111.34199999999998, "r_x3": 308.862, "r_y3": 111.34199999999998, "coord_origin": "TOPLEFT"}, "text": "not have post-processing results for SynthTabNet as images", "orig": "not have post-processing results for SynthTabNet as images", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 152, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 131.84900000000005, "r_x1": 545.115, "r_y1": 131.84900000000005, "r_x2": 545.115, "r_y2": 123.29700000000003, "r_x3": 308.862, "r_y3": 123.29700000000003, "coord_origin": "TOPLEFT"}, "text": "are only provided. To compare the performance of our pro-", "orig": "are only provided. To compare the performance of our pro-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 153, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 143.80499999999995, "r_x1": 502.017, "r_y1": 143.80499999999995, "r_x2": 502.017, "r_y2": 135.25300000000004, "r_x3": 308.862, "r_y3": 135.25300000000004, "coord_origin": "TOPLEFT"}, "text": "posed approach, we've integrated TableFormer's", "orig": "posed approach, we've integrated TableFormer's", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 154, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 504.473, "r_y0": 143.66200000000003, "r_x1": 545.11, "r_y1": 143.66200000000003, "r_x2": 545.11, "r_y2": 135.07399999999996, "r_x3": 504.473, "r_y3": 135.07399999999996, "coord_origin": "TOPLEFT"}, "text": "Cell BBox", "orig": "Cell BBox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 155, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 155.61699999999996, "r_x1": 343.163, "r_y1": 155.61699999999996, "r_x2": 343.163, "r_y2": 147.029, "r_x3": 308.862, "r_y3": 147.029, "coord_origin": "TOPLEFT"}, "text": "Decoder", "orig": "Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 156, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 346.371, "r_y0": 155.76, "r_x1": 437.818, "r_y1": 155.76, "r_x2": 437.818, "r_y2": 147.20799999999997, "r_x3": 346.371, "r_y3": 147.20799999999997, "coord_origin": "TOPLEFT"}, "text": "into EDD architecture.", "orig": "into EDD architecture.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 157, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 442.371, "r_y0": 155.76, "r_x1": 545.115, "r_y1": 155.76, "r_x2": 545.115, "r_y2": 147.20799999999997, "r_x3": 442.371, "r_y3": 147.20799999999997, "coord_origin": "TOPLEFT"}, "text": "As mentioned previously,", "orig": "As mentioned previously,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 158, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 167.71500000000003, "r_x1": 446.157, "r_y1": 167.71500000000003, "r_x2": 446.157, "r_y2": 159.163, "r_x3": 308.862, "r_y3": 159.163, "coord_origin": "TOPLEFT"}, "text": "the Structure Decoder provides the", "orig": "the Structure Decoder provides the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 159, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 448.29, "r_y0": 167.572, "r_x1": 525.042, "r_y1": 167.572, "r_x2": 525.042, "r_y2": 158.98400000000004, "r_x3": 448.29, "r_y3": 158.98400000000004, "coord_origin": "TOPLEFT"}, "text": "Cell BBox Decoder", "orig": "Cell BBox Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 160, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 527.399, "r_y0": 167.71500000000003, "r_x1": 545.113, "r_y1": 167.71500000000003, "r_x2": 545.113, "r_y2": 159.163, "r_x3": 527.399, "r_y3": 159.163, "coord_origin": "TOPLEFT"}, "text": "with", "orig": "with", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 161, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 179.66999999999996, "r_x1": 545.115, "r_y1": 179.66999999999996, "r_x2": 545.115, "r_y2": 171.11800000000005, "r_x3": 308.862, "r_y3": 171.11800000000005, "coord_origin": "TOPLEFT"}, "text": "the features needed to predict the bounding box predictions.", "orig": "the features needed to predict the bounding box predictions.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 162, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 191.625, "r_x1": 432.866, "r_y1": 191.625, "r_x2": 432.866, "r_y2": 183.07299999999998, "r_x3": 308.862, "r_y3": 183.07299999999998, "coord_origin": "TOPLEFT"}, "text": "Therefore, the accuracy of the", "orig": "Therefore, the accuracy of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 163, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 436.39, "r_y0": 191.48199999999997, "r_x1": 510.93, "r_y1": 191.48199999999997, "r_x2": 510.93, "r_y2": 182.894, "r_x3": 436.39, "r_y3": 182.894, "coord_origin": "TOPLEFT"}, "text": "Structure Decoder", "orig": "Structure Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 164, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 514.677, "r_y0": 191.625, "r_x1": 545.113, "r_y1": 191.625, "r_x2": 545.113, "r_y2": 183.07299999999998, "r_x3": 514.677, "r_y3": 183.07299999999998, "coord_origin": "TOPLEFT"}, "text": "directly", "orig": "directly", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 165, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 203.58000000000004, "r_x1": 431.173, "r_y1": 203.58000000000004, "r_x2": 431.173, "r_y2": 195.02800000000002, "r_x3": 308.862, "r_y3": 195.02800000000002, "coord_origin": "TOPLEFT"}, "text": "influences the accuracy of the", "orig": "influences the accuracy of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 166, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 434.679, "r_y0": 203.437, "r_x1": 514.181, "r_y1": 203.437, "r_x2": 514.181, "r_y2": 194.84900000000005, "r_x3": 434.679, "r_y3": 194.84900000000005, "coord_origin": "TOPLEFT"}, "text": "Cell BBox Decoder", "orig": "Cell BBox Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 167, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 514.176, "r_y0": 203.58000000000004, "r_x1": 516.667, "r_y1": 203.58000000000004, "r_x2": 516.667, "r_y2": 195.02800000000002, "r_x3": 514.176, "r_y3": 195.02800000000002, "coord_origin": "TOPLEFT"}, "text": ".", "orig": ".", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 168, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 522.794, "r_y0": 203.58000000000004, "r_x1": 529.429, "r_y1": 203.58000000000004, "r_x2": 529.429, "r_y2": 195.02800000000002, "r_x3": 522.794, "r_y3": 195.02800000000002, "coord_origin": "TOPLEFT"}, "text": "If", "orig": "If", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 169, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 532.936, "r_y0": 203.58000000000004, "r_x1": 545.11, "r_y1": 203.58000000000004, "r_x2": 545.11, "r_y2": 195.02800000000002, "r_x3": 532.936, "r_y3": 195.02800000000002, "coord_origin": "TOPLEFT"}, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 170, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 215.39300000000003, "r_x1": 382.356, "r_y1": 215.39300000000003, "r_x2": 382.356, "r_y2": 206.80499999999995, "r_x3": 308.862, "r_y3": 206.80499999999995, "coord_origin": "TOPLEFT"}, "text": "Structure Decoder", "orig": "Structure Decoder", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 171, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 385.075, "r_y0": 215.53599999999994, "r_x1": 545.114, "r_y1": 215.53599999999994, "r_x2": 545.114, "r_y2": 206.98400000000004, "r_x3": 385.075, "r_y3": 206.98400000000004, "coord_origin": "TOPLEFT"}, "text": "predicts an extra column, this will result", "orig": "predicts an extra column, this will result", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 172, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 227.49099999999999, "r_x1": 501.698, "r_y1": 227.49099999999999, "r_x2": 501.698, "r_y2": 218.93899999999996, "r_x3": 308.862, "r_y3": 218.93899999999996, "coord_origin": "TOPLEFT"}, "text": "in an extra column of predicted bounding boxes.", "orig": "in an extra column of predicted bounding boxes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "our Cell BBox Decoder accuracy for cells with a class label of 'content' only using the PASCAL VOC mAP metric for pre-processing and post-processing. Note that we do not have post-processing results for SynthTabNet as images are only provided. To compare the performance of our proposed approach, we've integrated TableFormer's Cell BBox Decoder into EDD architecture. As mentioned previously, the Structure Decoder provides the Cell BBox Decoder with the features needed to predict the bounding box predictions. Therefore, the accuracy of the Structure Decoder directly influences the accuracy of the Cell BBox Decoder . If the Structure Decoder predicts an extra column, this will result in an extra column of predicted bounding boxes."}, {"label": "table", "id": 8, "page_no": 6, "cluster": {"id": 8, "label": "table", "bbox": {"l": 308.4068603515625, "t": 247.87631225585938, "r": 533.6419677734375, "b": 303.8056640625, "coord_origin": "TOPLEFT"}, "confidence": 0.9691730737686157, "cells": [{"index": 173, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 339.323, "r_y0": 262.485, "r_x1": 365.335, "r_y1": 262.485, "r_x2": 365.335, "r_y2": 253.933, "r_x3": 339.323, "r_y3": 253.933, "coord_origin": "TOPLEFT"}, "text": "Model", "orig": "Model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 174, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 401.041, "r_y0": 262.485, "r_x1": 430.919, "r_y1": 262.485, "r_x2": 430.919, "r_y2": 253.933, "r_x3": 401.041, "r_y3": 253.933, "coord_origin": "TOPLEFT"}, "text": "Dataset", "orig": "Dataset", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 175, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 454.102, "r_y0": 262.485, "r_x1": 474.585, "r_y1": 262.485, "r_x2": 474.585, "r_y2": 253.933, "r_x3": 454.102, "r_y3": 253.933, "coord_origin": "TOPLEFT"}, "text": "mAP", "orig": "mAP", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 176, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 486.54, "r_y0": 262.485, "r_x1": 527.228, "r_y1": 262.485, "r_x2": 527.228, "r_y2": 253.933, "r_x3": 486.54, "r_y3": 253.933, "coord_origin": "TOPLEFT"}, "text": "mAP (PP)", "orig": "mAP (PP)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 177, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 327.656, "r_y0": 279.442, "r_x1": 377.001, "r_y1": 279.442, "r_x2": 377.001, "r_y2": 270.89, "r_x3": 327.656, "r_y3": 270.89, "coord_origin": "TOPLEFT"}, "text": "EDD+BBox", "orig": "EDD+BBox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 178, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 393.698, "r_y0": 279.442, "r_x1": 438.281, "r_y1": 279.442, "r_x2": 438.281, "r_y2": 270.89, "r_x3": 393.698, "r_y3": 270.89, "coord_origin": "TOPLEFT"}, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 179, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 455.636, "r_y0": 279.442, "r_x1": 473.07, "r_y1": 279.442, "r_x2": 473.07, "r_y2": 270.89, "r_x3": 455.636, "r_y3": 270.89, "coord_origin": "TOPLEFT"}, "text": "79.2", "orig": "79.2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 180, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 498.166, "r_y0": 279.442, "r_x1": 515.6, "r_y1": 279.442, "r_x2": 515.6, "r_y2": 270.89, "r_x3": 498.166, "r_y3": 270.89, "coord_origin": "TOPLEFT"}, "text": "82.7", "orig": "82.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 181, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 326.795, "r_y0": 291.397, "r_x1": 377.863, "r_y1": 291.397, "r_x2": 377.863, "r_y2": 282.845, "r_x3": 326.795, "r_y3": 282.845, "coord_origin": "TOPLEFT"}, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 182, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 393.694, "r_y0": 291.397, "r_x1": 438.276, "r_y1": 291.397, "r_x2": 438.276, "r_y2": 282.845, "r_x3": 393.694, "r_y3": 282.845, "coord_origin": "TOPLEFT"}, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 183, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 455.631, "r_y0": 291.413, "r_x1": 473.066, "r_y1": 291.413, "r_x2": 473.066, "r_y2": 282.457, "r_x3": 455.631, "r_y3": 282.457, "coord_origin": "TOPLEFT"}, "text": "82.1", "orig": "82.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 184, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 498.171, "r_y0": 291.413, "r_x1": 515.606, "r_y1": 291.413, "r_x2": 515.606, "r_y2": 282.457, "r_x3": 498.171, "r_y3": 282.457, "coord_origin": "TOPLEFT"}, "text": "86.8", "orig": "86.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 185, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 326.795, "r_y0": 303.352, "r_x1": 377.863, "r_y1": 303.352, "r_x2": 377.863, "r_y2": 294.8, "r_x3": 326.795, "r_y3": 294.8, "coord_origin": "TOPLEFT"}, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 186, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 389.818, "r_y0": 303.352, "r_x1": 442.152, "r_y1": 303.352, "r_x2": 442.152, "r_y2": 294.8, "r_x3": 389.818, "r_y3": 294.8, "coord_origin": "TOPLEFT"}, "text": "SynthTabNet", "orig": "SynthTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 187, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 455.631, "r_y0": 303.352, "r_x1": 473.066, "r_y1": 303.352, "r_x2": 473.066, "r_y2": 294.8, "r_x3": 455.631, "r_y3": 294.8, "coord_origin": "TOPLEFT"}, "text": "87.7", "orig": "87.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 188, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 505.225, "r_y0": 303.352, "r_x1": 508.543, "r_y1": 303.352, "r_x2": 508.543, "r_y2": 294.8, "r_x3": 505.225, "r_y3": 294.8, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": [{"id": 83, "label": "text", "bbox": {"l": 339.323, "t": 253.933, "r": 365.335, "b": 262.485, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 173, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 339.323, "r_y0": 262.485, "r_x1": 365.335, "r_y1": 262.485, "r_x2": 365.335, "r_y2": 253.933, "r_x3": 339.323, "r_y3": 253.933, "coord_origin": "TOPLEFT"}, "text": "Model", "orig": "Model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 84, "label": "text", "bbox": {"l": 401.041, "t": 253.933, "r": 430.919, "b": 262.485, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 174, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 401.041, "r_y0": 262.485, "r_x1": 430.919, "r_y1": 262.485, "r_x2": 430.919, "r_y2": 253.933, "r_x3": 401.041, "r_y3": 253.933, "coord_origin": "TOPLEFT"}, "text": "Dataset", "orig": "Dataset", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 85, "label": "text", "bbox": {"l": 454.102, "t": 253.933, "r": 474.585, "b": 262.485, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 175, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 454.102, "r_y0": 262.485, "r_x1": 474.585, "r_y1": 262.485, "r_x2": 474.585, "r_y2": 253.933, "r_x3": 454.102, "r_y3": 253.933, "coord_origin": "TOPLEFT"}, "text": "mAP", "orig": "mAP", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 86, "label": "text", "bbox": {"l": 486.54, "t": 253.933, "r": 527.228, "b": 262.485, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 176, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 486.54, "r_y0": 262.485, "r_x1": 527.228, "r_y1": 262.485, "r_x2": 527.228, "r_y2": 253.933, "r_x3": 486.54, "r_y3": 253.933, "coord_origin": "TOPLEFT"}, "text": "mAP (PP)", "orig": "mAP (PP)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 87, "label": "text", "bbox": {"l": 327.656, "t": 270.89, "r": 377.001, "b": 279.442, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 177, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 327.656, "r_y0": 279.442, "r_x1": 377.001, "r_y1": 279.442, "r_x2": 377.001, "r_y2": 270.89, "r_x3": 327.656, "r_y3": 270.89, "coord_origin": "TOPLEFT"}, "text": "EDD+BBox", "orig": "EDD+BBox", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 88, "label": "text", "bbox": {"l": 393.698, "t": 270.89, "r": 438.281, "b": 279.442, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 178, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 393.698, "r_y0": 279.442, "r_x1": 438.281, "r_y1": 279.442, "r_x2": 438.281, "r_y2": 270.89, "r_x3": 393.698, "r_y3": 270.89, "coord_origin": "TOPLEFT"}, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 89, "label": "text", "bbox": {"l": 455.636, "t": 270.89, "r": 473.07, "b": 279.442, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 179, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 455.636, "r_y0": 279.442, "r_x1": 473.07, "r_y1": 279.442, "r_x2": 473.07, "r_y2": 270.89, "r_x3": 455.636, "r_y3": 270.89, "coord_origin": "TOPLEFT"}, "text": "79.2", "orig": "79.2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 90, "label": "text", "bbox": {"l": 498.166, "t": 270.89, "r": 515.6, "b": 279.442, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 180, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 498.166, "r_y0": 279.442, "r_x1": 515.6, "r_y1": 279.442, "r_x2": 515.6, "r_y2": 270.89, "r_x3": 498.166, "r_y3": 270.89, "coord_origin": "TOPLEFT"}, "text": "82.7", "orig": "82.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 91, "label": "text", "bbox": {"l": 326.795, "t": 282.845, "r": 377.863, "b": 291.397, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 181, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 326.795, "r_y0": 291.397, "r_x1": 377.863, "r_y1": 291.397, "r_x2": 377.863, "r_y2": 282.845, "r_x3": 326.795, "r_y3": 282.845, "coord_origin": "TOPLEFT"}, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 92, "label": "text", "bbox": {"l": 393.694, "t": 282.845, "r": 438.276, "b": 291.397, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 182, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 393.694, "r_y0": 291.397, "r_x1": 438.276, "r_y1": 291.397, "r_x2": 438.276, "r_y2": 282.845, "r_x3": 393.694, "r_y3": 282.845, "coord_origin": "TOPLEFT"}, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 93, "label": "text", "bbox": {"l": 455.631, "t": 282.457, "r": 473.066, "b": 291.413, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 183, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 455.631, "r_y0": 291.413, "r_x1": 473.066, "r_y1": 291.413, "r_x2": 473.066, "r_y2": 282.457, "r_x3": 455.631, "r_y3": 282.457, "coord_origin": "TOPLEFT"}, "text": "82.1", "orig": "82.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 94, "label": "text", "bbox": {"l": 498.171, "t": 282.457, "r": 515.606, "b": 291.413, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 184, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 498.171, "r_y0": 291.413, "r_x1": 515.606, "r_y1": 291.413, "r_x2": 515.606, "r_y2": 282.457, "r_x3": 498.171, "r_y3": 282.457, "coord_origin": "TOPLEFT"}, "text": "86.8", "orig": "86.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 95, "label": "text", "bbox": {"l": 326.795, "t": 294.8, "r": 377.863, "b": 303.352, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 185, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 326.795, "r_y0": 303.352, "r_x1": 377.863, "r_y1": 303.352, "r_x2": 377.863, "r_y2": 294.8, "r_x3": 326.795, "r_y3": 294.8, "coord_origin": "TOPLEFT"}, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 96, "label": "text", "bbox": {"l": 389.818, "t": 294.8, "r": 442.152, "b": 303.352, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 186, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 389.818, "r_y0": 303.352, "r_x1": 442.152, "r_y1": 303.352, "r_x2": 442.152, "r_y2": 294.8, "r_x3": 389.818, "r_y3": 294.8, "coord_origin": "TOPLEFT"}, "text": "SynthTabNet", "orig": "SynthTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 97, "label": "text", "bbox": {"l": 455.631, "t": 294.8, "r": 473.066, "b": 303.352, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 187, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 455.631, "r_y0": 303.352, "r_x1": 473.066, "r_y1": 303.352, "r_x2": 473.066, "r_y2": 294.8, "r_x3": 455.631, "r_y3": 294.8, "coord_origin": "TOPLEFT"}, "text": "87.7", "orig": "87.7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 98, "label": "text", "bbox": {"l": 505.225, "t": 294.8, "r": 508.543, "b": 303.352, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 188, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 505.225, "r_y0": 303.352, "r_x1": 508.543, "r_y1": 303.352, "r_x2": 508.543, "r_y2": 294.8, "r_x3": 505.225, "r_y3": 294.8, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}]}, "text": null, "otsl_seq": ["ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl"], "num_rows": 4, "num_cols": 4, "table_cells": [{"bbox": {"l": 339.323, "t": 253.933, "r": 365.335, "b": 262.485, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Model", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 401.041, "t": 253.933, "r": 430.919, "b": 262.485, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "Dataset", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 454.102, "t": 253.933, "r": 474.585, "b": 262.485, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "mAP", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 486.54, "t": 253.933, "r": 527.228, "b": 262.485, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "mAP (PP)", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 327.656, "t": 270.89, "r": 377.001, "b": 279.442, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "EDD+BBox", "column_header": false, "row_header": true, "row_section": false}, {"bbox": {"l": 393.698, "t": 270.89, "r": 438.281, "b": 279.442, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "PubTabNet", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 455.636, "t": 270.89, "r": 473.07, "b": 279.442, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "79.2", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 498.166, "t": 270.89, "r": 515.6, "b": 279.442, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "82.7", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 326.795, "t": 282.845, "r": 377.863, "b": 291.397, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "TableFormer", "column_header": false, "row_header": true, "row_section": false}, {"bbox": {"l": 393.694, "t": 282.845, "r": 438.276, "b": 291.397, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "PubTabNet", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 455.631, "t": 282.457, "r": 473.066, "b": 291.413, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "82.1", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 498.171, "t": 282.457, "r": 515.606, "b": 291.413, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "86.8", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 326.795, "t": 294.8, "r": 377.863, "b": 303.352, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "TableFormer", "column_header": false, "row_header": true, "row_section": false}, {"bbox": {"l": 389.818, "t": 294.8, "r": 442.152, "b": 303.352, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "SynthTabNet", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 455.631, "t": 294.8, "r": 473.066, "b": 303.352, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "87.7", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 505.225, "t": 294.8, "r": 508.543, "b": 303.352, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "-", "column_header": false, "row_header": false, "row_section": false}]}, {"label": "caption", "id": 12, "page_no": 6, "cluster": {"id": 12, "label": "caption", "bbox": {"l": 308.862, "t": 316.718, "r": 545.115, "b": 337.225, "coord_origin": "TOPLEFT"}, "confidence": 0.9519917964935303, "cells": [{"index": 189, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 325.27, "r_x1": 341.499, "r_y1": 325.27, "r_x2": 341.499, "r_y2": 316.718, "r_x3": 308.862, "r_y3": 316.718, "coord_origin": "TOPLEFT"}, "text": "Table 3:", "orig": "Table 3:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 190, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 348.603, "r_y0": 325.27, "r_x1": 545.115, "r_y1": 325.27, "r_x2": 545.115, "r_y2": 316.718, "r_x3": 348.603, "r_y3": 316.718, "coord_origin": "TOPLEFT"}, "text": "Cell Bounding Box detection results on PubTab-", "orig": "Cell Bounding Box detection results on PubTab-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 191, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 337.225, "r_x1": 474.978, "r_y1": 337.225, "r_x2": 474.978, "r_y2": 328.673, "r_x3": 308.862, "r_y3": 328.673, "coord_origin": "TOPLEFT"}, "text": "Net, and FinTabNet. PP: Post-processing.", "orig": "Net, and FinTabNet. PP: Post-processing.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Table 3: Cell Bounding Box detection results on PubTabNet, and FinTabNet. PP: Post-processing."}, {"label": "text", "id": 4, "page_no": 6, "cluster": {"id": 4, "label": "text", "bbox": {"l": 308.862, "t": 367.68, "r": 545.116, "b": 520.082, "coord_origin": "TOPLEFT"}, "confidence": 0.9835010766983032, "cells": [{"index": 192, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 376.636, "r_x1": 378.949, "r_y1": 376.636, "r_x2": 378.949, "r_y2": 367.68, "r_x3": 320.817, "r_y3": 367.68, "coord_origin": "TOPLEFT"}, "text": "Cell Content.", "orig": "Cell Content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 193, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 387.079, "r_y0": 376.62, "r_x1": 395.378, "r_y1": 376.62, "r_x2": 395.378, "r_y2": 368.068, "r_x3": 387.079, "r_y3": 368.068, "coord_origin": "TOPLEFT"}, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 194, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 399.552, "r_y0": 376.62, "r_x1": 413.948, "r_y1": 376.62, "r_x2": 413.948, "r_y2": 368.068, "r_x3": 399.552, "r_y3": 368.068, "coord_origin": "TOPLEFT"}, "text": "this", "orig": "this", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 195, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 418.112, "r_y0": 376.62, "r_x1": 448.827, "r_y1": 376.62, "r_x2": 448.827, "r_y2": 368.068, "r_x3": 418.112, "r_y3": 368.068, "coord_origin": "TOPLEFT"}, "text": "section,", "orig": "section,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 196, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 453.42, "r_y0": 376.62, "r_x1": 545.116, "r_y1": 376.62, "r_x2": 545.116, "r_y2": 368.068, "r_x3": 453.42, "r_y3": 368.068, "coord_origin": "TOPLEFT"}, "text": "we evaluate the entire", "orig": "we evaluate the entire", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 197, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 388.575, "r_x1": 487.193, "r_y1": 388.575, "r_x2": 487.193, "r_y2": 380.023, "r_x3": 308.862, "r_y3": 380.023, "coord_origin": "TOPLEFT"}, "text": "pipeline of recovering a table with content.", "orig": "pipeline of recovering a table with content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 198, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 493.967, "r_y0": 388.575, "r_x1": 545.115, "r_y1": 388.575, "r_x2": 545.115, "r_y2": 380.023, "r_x3": 493.967, "r_y3": 380.023, "coord_origin": "TOPLEFT"}, "text": "Here we put", "orig": "Here we put", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 199, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 400.53, "r_x1": 545.115, "r_y1": 400.53, "r_x2": 545.115, "r_y2": 391.978, "r_x3": 308.862, "r_y3": 391.978, "coord_origin": "TOPLEFT"}, "text": "our approach to test by capitalizing on extracting content", "orig": "our approach to test by capitalizing on extracting content", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 200, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 412.486, "r_x1": 545.115, "r_y1": 412.486, "r_x2": 545.115, "r_y2": 403.934, "r_x3": 308.862, "r_y3": 403.934, "coord_origin": "TOPLEFT"}, "text": "from the PDF cells rather than decoding from images. Tab.", "orig": "from the PDF cells rather than decoding from images. Tab.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 201, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 424.441, "r_x1": 545.115, "r_y1": 424.441, "r_x2": 545.115, "r_y2": 415.889, "r_x3": 308.862, "r_y3": 415.889, "coord_origin": "TOPLEFT"}, "text": "4 shows the TEDs score of HTML code representing the", "orig": "4 shows the TEDs score of HTML code representing the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 202, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 436.396, "r_x1": 545.115, "r_y1": 436.396, "r_x2": 545.115, "r_y2": 427.844, "r_x3": 308.862, "r_y3": 427.844, "coord_origin": "TOPLEFT"}, "text": "structure of the table along with the content inserted in the", "orig": "structure of the table along with the content inserted in the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 203, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 448.351, "r_x1": 545.115, "r_y1": 448.351, "r_x2": 545.115, "r_y2": 439.799, "r_x3": 308.862, "r_y3": 439.799, "coord_origin": "TOPLEFT"}, "text": "data cell and compared with the ground-truth. Our method", "orig": "data cell and compared with the ground-truth. Our method", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 204, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 460.306, "r_x1": 350.237, "r_y1": 460.306, "r_x2": 350.237, "r_y2": 451.754, "r_x3": 308.862, "r_y3": 451.754, "coord_origin": "TOPLEFT"}, "text": "achieved a", "orig": "achieved a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 205, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 352.176, "r_y0": 460.322, "r_x1": 374.592, "r_y1": 460.322, "r_x2": 374.592, "r_y2": 451.366, "r_x3": 352.176, "r_y3": 451.366, "coord_origin": "TOPLEFT"}, "text": "5.3%", "orig": "5.3%", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 206, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 376.533, "r_y0": 460.306, "r_x1": 545.11, "r_y1": 460.306, "r_x2": 545.11, "r_y2": 451.754, "r_x3": 376.533, "r_y3": 451.754, "coord_origin": "TOPLEFT"}, "text": "increase over the state-of-the-art, and com-", "orig": "increase over the state-of-the-art, and com-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 207, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 472.261, "r_x1": 380.523, "r_y1": 472.261, "r_x2": 380.523, "r_y2": 463.709, "r_x3": 308.862, "r_y3": 463.709, "coord_origin": "TOPLEFT"}, "text": "mercial solutions.", "orig": "mercial solutions.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 208, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 386.042, "r_y0": 472.261, "r_x1": 545.115, "r_y1": 472.261, "r_x2": 545.115, "r_y2": 463.709, "r_x3": 386.042, "r_y3": 463.709, "coord_origin": "TOPLEFT"}, "text": "We believe our scores would be higher", "orig": "We believe our scores would be higher", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 209, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 484.217, "r_x1": 314.949, "r_y1": 484.217, "r_x2": 314.949, "r_y2": 475.665, "r_x3": 308.862, "r_y3": 475.665, "coord_origin": "TOPLEFT"}, "text": "if", "orig": "if", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 210, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 318.008, "r_y0": 484.217, "r_x1": 545.115, "r_y1": 484.217, "r_x2": 545.115, "r_y2": 475.665, "r_x3": 318.008, "r_y3": 475.665, "coord_origin": "TOPLEFT"}, "text": "the HTML ground-truth matched the extracted PDF cell", "orig": "the HTML ground-truth matched the extracted PDF cell", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 211, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 496.172, "r_x1": 340.683, "r_y1": 496.172, "r_x2": 340.683, "r_y2": 487.62, "r_x3": 308.862, "r_y3": 487.62, "coord_origin": "TOPLEFT"}, "text": "content.", "orig": "content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 212, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 345.793, "r_y0": 496.172, "r_x1": 545.115, "r_y1": 496.172, "r_x2": 545.115, "r_y2": 487.62, "r_x3": 345.793, "r_y3": 487.62, "coord_origin": "TOPLEFT"}, "text": "Unfortunately, there are small discrepancies such", "orig": "Unfortunately, there are small discrepancies such", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 213, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 508.127, "r_x1": 545.115, "r_y1": 508.127, "r_x2": 545.115, "r_y2": 499.575, "r_x3": 308.862, "r_y3": 499.575, "coord_origin": "TOPLEFT"}, "text": "as spacings around words or special characters with various", "orig": "as spacings around words or special characters with various", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 214, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 520.082, "r_x1": 405.698, "r_y1": 520.082, "r_x2": 405.698, "r_y2": 511.53, "r_x3": 308.862, "r_y3": 511.53, "coord_origin": "TOPLEFT"}, "text": "unicode representations.", "orig": "unicode representations.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Cell Content. In this section, we evaluate the entire pipeline of recovering a table with content. Here we put our approach to test by capitalizing on extracting content from the PDF cells rather than decoding from images. Tab. 4 shows the TEDs score of HTML code representing the structure of the table along with the content inserted in the data cell and compared with the ground-truth. Our method achieved a 5.3% increase over the state-of-the-art, and commercial solutions. We believe our scores would be higher if the HTML ground-truth matched the extracted PDF cell content. Unfortunately, there are small discrepancies such as spacings around words or special characters with various unicode representations."}, {"label": "table", "id": 5, "page_no": 6, "cluster": {"id": 5, "label": "table", "bbox": {"l": 332.9688720703125, "t": 540.2835693359375, "r": 520.942138671875, "b": 643.2697143554688, "coord_origin": "TOPLEFT"}, "confidence": 0.9775567650794983, "cells": [{"index": 215, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 358.011, "r_y0": 561.054, "r_x1": 384.023, "r_y1": 561.054, "r_x2": 384.023, "r_y2": 552.502, "r_x3": 358.011, "r_y3": 552.502, "coord_origin": "TOPLEFT"}, "text": "Model", "orig": "Model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 216, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 449.034, "r_y0": 555.076, "r_x1": 473.94, "r_y1": 555.076, "r_x2": 473.94, "r_y2": 546.524, "r_x3": 449.034, "r_y3": 546.524, "coord_origin": "TOPLEFT"}, "text": "TEDS", "orig": "TEDS", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 217, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 408.506, "r_y0": 567.031, "r_x1": 436.74, "r_y1": 567.031, "r_x2": 436.74, "r_y2": 558.479, "r_x3": 408.506, "r_y3": 558.479, "coord_origin": "TOPLEFT"}, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 218, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 448.695, "r_y0": 567.031, "r_x1": 485.079, "r_y1": 567.031, "r_x2": 485.079, "r_y2": 558.479, "r_x3": 448.695, "r_y3": 558.479, "coord_origin": "TOPLEFT"}, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 219, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 499.385, "r_y0": 567.031, "r_x1": 512.117, "r_y1": 567.031, "r_x2": 512.117, "r_y2": 558.479, "r_x3": 499.385, "r_y3": 558.479, "coord_origin": "TOPLEFT"}, "text": "All", "orig": "All", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 220, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 357.682, "r_y0": 583.988, "r_x1": 384.352, "r_y1": 583.988, "r_x2": 384.352, "r_y2": 575.436, "r_x3": 357.682, "r_y3": 575.436, "coord_origin": "TOPLEFT"}, "text": "Tabula", "orig": "Tabula", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 221, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 413.901, "r_y0": 583.988, "r_x1": 431.336, "r_y1": 583.988, "r_x2": 431.336, "r_y2": 575.436, "r_x3": 413.901, "r_y3": 575.436, "coord_origin": "TOPLEFT"}, "text": "78.0", "orig": "78.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 222, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 458.165, "r_y0": 583.988, "r_x1": 475.599, "r_y1": 583.988, "r_x2": 475.599, "r_y2": 575.436, "r_x3": 458.165, "r_y3": 575.436, "coord_origin": "TOPLEFT"}, "text": "57.8", "orig": "57.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 223, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 497.029, "r_y0": 583.988, "r_x1": 514.463, "r_y1": 583.988, "r_x2": 514.463, "r_y2": 575.436, "r_x3": 497.029, "r_y3": 575.436, "coord_origin": "TOPLEFT"}, "text": "67.9", "orig": "67.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 224, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 350.723, "r_y0": 595.943, "r_x1": 391.311, "r_y1": 595.943, "r_x2": 391.311, "r_y2": 587.391, "r_x3": 350.723, "r_y3": 587.391, "coord_origin": "TOPLEFT"}, "text": "Traprange", "orig": "Traprange", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 225, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 413.906, "r_y0": 595.943, "r_x1": 431.34, "r_y1": 595.943, "r_x2": 431.34, "r_y2": 587.391, "r_x3": 413.906, "r_y3": 587.391, "coord_origin": "TOPLEFT"}, "text": "60.8", "orig": "60.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 226, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 458.17, "r_y0": 595.943, "r_x1": 475.604, "r_y1": 595.943, "r_x2": 475.604, "r_y2": 587.391, "r_x3": 458.17, "r_y3": 587.391, "coord_origin": "TOPLEFT"}, "text": "49.9", "orig": "49.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 227, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 497.034, "r_y0": 595.943, "r_x1": 514.468, "r_y1": 595.943, "r_x2": 514.468, "r_y2": 587.391, "r_x3": 497.034, "r_y3": 587.391, "coord_origin": "TOPLEFT"}, "text": "55.4", "orig": "55.4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 228, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 354.136, "r_y0": 607.899, "r_x1": 387.899, "r_y1": 607.899, "r_x2": 387.899, "r_y2": 599.347, "r_x3": 354.136, "r_y3": 599.347, "coord_origin": "TOPLEFT"}, "text": "Camelot", "orig": "Camelot", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 229, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 413.902, "r_y0": 607.899, "r_x1": 431.336, "r_y1": 607.899, "r_x2": 431.336, "r_y2": 599.347, "r_x3": 413.902, "r_y3": 599.347, "coord_origin": "TOPLEFT"}, "text": "80.0", "orig": "80.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 230, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 458.165, "r_y0": 607.899, "r_x1": 475.6, "r_y1": 607.899, "r_x2": 475.6, "r_y2": 599.347, "r_x3": 458.165, "r_y3": 599.347, "coord_origin": "TOPLEFT"}, "text": "66.0", "orig": "66.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 231, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 497.03, "r_y0": 607.899, "r_x1": 514.464, "r_y1": 607.899, "r_x2": 514.464, "r_y2": 599.347, "r_x3": 497.03, "r_y3": 599.347, "coord_origin": "TOPLEFT"}, "text": "73.0", "orig": "73.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 232, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 346.559, "r_y0": 619.854, "r_x1": 395.475, "r_y1": 619.854, "r_x2": 395.475, "r_y2": 611.302, "r_x3": 346.559, "r_y3": 611.302, "coord_origin": "TOPLEFT"}, "text": "Acrobat Pro", "orig": "Acrobat Pro", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 233, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 413.906, "r_y0": 619.854, "r_x1": 431.341, "r_y1": 619.854, "r_x2": 431.341, "r_y2": 611.302, "r_x3": 413.906, "r_y3": 611.302, "coord_origin": "TOPLEFT"}, "text": "68.9", "orig": "68.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 234, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 458.17, "r_y0": 619.854, "r_x1": 475.605, "r_y1": 619.854, "r_x2": 475.605, "r_y2": 611.302, "r_x3": 458.17, "r_y3": 611.302, "coord_origin": "TOPLEFT"}, "text": "61.8", "orig": "61.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 235, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 497.034, "r_y0": 619.854, "r_x1": 514.469, "r_y1": 619.854, "r_x2": 514.469, "r_y2": 611.302, "r_x3": 497.034, "r_y3": 611.302, "coord_origin": "TOPLEFT"}, "text": "65.3", "orig": "65.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 236, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 360.781, "r_y0": 631.809, "r_x1": 381.254, "r_y1": 631.809, "r_x2": 381.254, "r_y2": 623.2570000000001, "r_x3": 360.781, "r_y3": 623.2570000000001, "coord_origin": "TOPLEFT"}, "text": "EDD", "orig": "EDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 237, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 413.902, "r_y0": 631.809, "r_x1": 431.336, "r_y1": 631.809, "r_x2": 431.336, "r_y2": 623.2570000000001, "r_x3": 413.902, "r_y3": 623.2570000000001, "coord_origin": "TOPLEFT"}, "text": "91.2", "orig": "91.2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 238, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 458.165, "r_y0": 631.809, "r_x1": 475.6, "r_y1": 631.809, "r_x2": 475.6, "r_y2": 623.2570000000001, "r_x3": 458.165, "r_y3": 623.2570000000001, "coord_origin": "TOPLEFT"}, "text": "85.4", "orig": "85.4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 239, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 497.03, "r_y0": 631.809, "r_x1": 514.464, "r_y1": 631.809, "r_x2": 514.464, "r_y2": 623.2570000000001, "r_x3": 497.03, "r_y3": 623.2570000000001, "coord_origin": "TOPLEFT"}, "text": "88.3", "orig": "88.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 240, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 345.483, "r_y0": 643.764, "r_x1": 396.551, "r_y1": 643.764, "r_x2": 396.551, "r_y2": 635.212, "r_x3": 345.483, "r_y3": 635.212, "coord_origin": "TOPLEFT"}, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 241, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 413.906, "r_y0": 643.764, "r_x1": 431.341, "r_y1": 643.764, "r_x2": 431.341, "r_y2": 635.212, "r_x3": 413.906, "r_y3": 635.212, "coord_origin": "TOPLEFT"}, "text": "95.4", "orig": "95.4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 242, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 458.17, "r_y0": 643.764, "r_x1": 475.605, "r_y1": 643.764, "r_x2": 475.605, "r_y2": 635.212, "r_x3": 458.17, "r_y3": 635.212, "coord_origin": "TOPLEFT"}, "text": "90.1", "orig": "90.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 243, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 497.034, "r_y0": 643.78, "r_x1": 514.469, "r_y1": 643.78, "r_x2": 514.469, "r_y2": 634.8240000000001, "r_x3": 497.034, "r_y3": 634.8240000000001, "coord_origin": "TOPLEFT"}, "text": "93.6", "orig": "93.6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": [{"id": 99, "label": "text", "bbox": {"l": 358.011, "t": 552.502, "r": 384.023, "b": 561.054, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 215, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 358.011, "r_y0": 561.054, "r_x1": 384.023, "r_y1": 561.054, "r_x2": 384.023, "r_y2": 552.502, "r_x3": 358.011, "r_y3": 552.502, "coord_origin": "TOPLEFT"}, "text": "Model", "orig": "Model", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 100, "label": "text", "bbox": {"l": 449.034, "t": 546.524, "r": 473.94, "b": 555.076, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 216, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 449.034, "r_y0": 555.076, "r_x1": 473.94, "r_y1": 555.076, "r_x2": 473.94, "r_y2": 546.524, "r_x3": 449.034, "r_y3": 546.524, "coord_origin": "TOPLEFT"}, "text": "TEDS", "orig": "TEDS", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 101, "label": "text", "bbox": {"l": 408.506, "t": 558.479, "r": 436.74, "b": 567.031, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 217, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 408.506, "r_y0": 567.031, "r_x1": 436.74, "r_y1": 567.031, "r_x2": 436.74, "r_y2": 558.479, "r_x3": 408.506, "r_y3": 558.479, "coord_origin": "TOPLEFT"}, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 102, "label": "text", "bbox": {"l": 448.695, "t": 558.479, "r": 485.079, "b": 567.031, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 218, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 448.695, "r_y0": 567.031, "r_x1": 485.079, "r_y1": 567.031, "r_x2": 485.079, "r_y2": 558.479, "r_x3": 448.695, "r_y3": 558.479, "coord_origin": "TOPLEFT"}, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 103, "label": "text", "bbox": {"l": 499.385, "t": 558.479, "r": 512.117, "b": 567.031, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 219, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 499.385, "r_y0": 567.031, "r_x1": 512.117, "r_y1": 567.031, "r_x2": 512.117, "r_y2": 558.479, "r_x3": 499.385, "r_y3": 558.479, "coord_origin": "TOPLEFT"}, "text": "All", "orig": "All", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 104, "label": "text", "bbox": {"l": 357.682, "t": 575.436, "r": 384.352, "b": 583.988, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 220, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 357.682, "r_y0": 583.988, "r_x1": 384.352, "r_y1": 583.988, "r_x2": 384.352, "r_y2": 575.436, "r_x3": 357.682, "r_y3": 575.436, "coord_origin": "TOPLEFT"}, "text": "Tabula", "orig": "Tabula", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 105, "label": "text", "bbox": {"l": 413.901, "t": 575.436, "r": 431.336, "b": 583.988, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 221, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 413.901, "r_y0": 583.988, "r_x1": 431.336, "r_y1": 583.988, "r_x2": 431.336, "r_y2": 575.436, "r_x3": 413.901, "r_y3": 575.436, "coord_origin": "TOPLEFT"}, "text": "78.0", "orig": "78.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 106, "label": "text", "bbox": {"l": 458.165, "t": 575.436, "r": 475.599, "b": 583.988, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 222, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 458.165, "r_y0": 583.988, "r_x1": 475.599, "r_y1": 583.988, "r_x2": 475.599, "r_y2": 575.436, "r_x3": 458.165, "r_y3": 575.436, "coord_origin": "TOPLEFT"}, "text": "57.8", "orig": "57.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 107, "label": "text", "bbox": {"l": 497.029, "t": 575.436, "r": 514.463, "b": 583.988, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 223, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 497.029, "r_y0": 583.988, "r_x1": 514.463, "r_y1": 583.988, "r_x2": 514.463, "r_y2": 575.436, "r_x3": 497.029, "r_y3": 575.436, "coord_origin": "TOPLEFT"}, "text": "67.9", "orig": "67.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 108, "label": "text", "bbox": {"l": 350.723, "t": 587.391, "r": 391.311, "b": 595.943, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 224, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 350.723, "r_y0": 595.943, "r_x1": 391.311, "r_y1": 595.943, "r_x2": 391.311, "r_y2": 587.391, "r_x3": 350.723, "r_y3": 587.391, "coord_origin": "TOPLEFT"}, "text": "Traprange", "orig": "Traprange", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 109, "label": "text", "bbox": {"l": 413.906, "t": 587.391, "r": 431.34, "b": 595.943, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 225, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 413.906, "r_y0": 595.943, "r_x1": 431.34, "r_y1": 595.943, "r_x2": 431.34, "r_y2": 587.391, "r_x3": 413.906, "r_y3": 587.391, "coord_origin": "TOPLEFT"}, "text": "60.8", "orig": "60.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 110, "label": "text", "bbox": {"l": 458.17, "t": 587.391, "r": 475.604, "b": 595.943, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 226, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 458.17, "r_y0": 595.943, "r_x1": 475.604, "r_y1": 595.943, "r_x2": 475.604, "r_y2": 587.391, "r_x3": 458.17, "r_y3": 587.391, "coord_origin": "TOPLEFT"}, "text": "49.9", "orig": "49.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 111, "label": "text", "bbox": {"l": 497.034, "t": 587.391, "r": 514.468, "b": 595.943, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 227, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 497.034, "r_y0": 595.943, "r_x1": 514.468, "r_y1": 595.943, "r_x2": 514.468, "r_y2": 587.391, "r_x3": 497.034, "r_y3": 587.391, "coord_origin": "TOPLEFT"}, "text": "55.4", "orig": "55.4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 112, "label": "text", "bbox": {"l": 354.136, "t": 599.347, "r": 387.899, "b": 607.899, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 228, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 354.136, "r_y0": 607.899, "r_x1": 387.899, "r_y1": 607.899, "r_x2": 387.899, "r_y2": 599.347, "r_x3": 354.136, "r_y3": 599.347, "coord_origin": "TOPLEFT"}, "text": "Camelot", "orig": "Camelot", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 113, "label": "text", "bbox": {"l": 413.902, "t": 599.347, "r": 431.336, "b": 607.899, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 229, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 413.902, "r_y0": 607.899, "r_x1": 431.336, "r_y1": 607.899, "r_x2": 431.336, "r_y2": 599.347, "r_x3": 413.902, "r_y3": 599.347, "coord_origin": "TOPLEFT"}, "text": "80.0", "orig": "80.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 114, "label": "text", "bbox": {"l": 458.165, "t": 599.347, "r": 475.6, "b": 607.899, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 230, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 458.165, "r_y0": 607.899, "r_x1": 475.6, "r_y1": 607.899, "r_x2": 475.6, "r_y2": 599.347, "r_x3": 458.165, "r_y3": 599.347, "coord_origin": "TOPLEFT"}, "text": "66.0", "orig": "66.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 115, "label": "text", "bbox": {"l": 497.03, "t": 599.347, "r": 514.464, "b": 607.899, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 231, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 497.03, "r_y0": 607.899, "r_x1": 514.464, "r_y1": 607.899, "r_x2": 514.464, "r_y2": 599.347, "r_x3": 497.03, "r_y3": 599.347, "coord_origin": "TOPLEFT"}, "text": "73.0", "orig": "73.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 116, "label": "text", "bbox": {"l": 346.559, "t": 611.302, "r": 395.475, "b": 619.854, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 232, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 346.559, "r_y0": 619.854, "r_x1": 395.475, "r_y1": 619.854, "r_x2": 395.475, "r_y2": 611.302, "r_x3": 346.559, "r_y3": 611.302, "coord_origin": "TOPLEFT"}, "text": "Acrobat Pro", "orig": "Acrobat Pro", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 117, "label": "text", "bbox": {"l": 413.906, "t": 611.302, "r": 431.341, "b": 619.854, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 233, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 413.906, "r_y0": 619.854, "r_x1": 431.341, "r_y1": 619.854, "r_x2": 431.341, "r_y2": 611.302, "r_x3": 413.906, "r_y3": 611.302, "coord_origin": "TOPLEFT"}, "text": "68.9", "orig": "68.9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 118, "label": "text", "bbox": {"l": 458.17, "t": 611.302, "r": 475.605, "b": 619.854, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 234, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 458.17, "r_y0": 619.854, "r_x1": 475.605, "r_y1": 619.854, "r_x2": 475.605, "r_y2": 611.302, "r_x3": 458.17, "r_y3": 611.302, "coord_origin": "TOPLEFT"}, "text": "61.8", "orig": "61.8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 119, "label": "text", "bbox": {"l": 497.034, "t": 611.302, "r": 514.469, "b": 619.854, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 235, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 497.034, "r_y0": 619.854, "r_x1": 514.469, "r_y1": 619.854, "r_x2": 514.469, "r_y2": 611.302, "r_x3": 497.034, "r_y3": 611.302, "coord_origin": "TOPLEFT"}, "text": "65.3", "orig": "65.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 120, "label": "text", "bbox": {"l": 360.781, "t": 623.2570000000001, "r": 381.254, "b": 631.809, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 236, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 360.781, "r_y0": 631.809, "r_x1": 381.254, "r_y1": 631.809, "r_x2": 381.254, "r_y2": 623.2570000000001, "r_x3": 360.781, "r_y3": 623.2570000000001, "coord_origin": "TOPLEFT"}, "text": "EDD", "orig": "EDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 121, "label": "text", "bbox": {"l": 413.902, "t": 623.2570000000001, "r": 431.336, "b": 631.809, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 237, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 413.902, "r_y0": 631.809, "r_x1": 431.336, "r_y1": 631.809, "r_x2": 431.336, "r_y2": 623.2570000000001, "r_x3": 413.902, "r_y3": 623.2570000000001, "coord_origin": "TOPLEFT"}, "text": "91.2", "orig": "91.2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 122, "label": "text", "bbox": {"l": 458.165, "t": 623.2570000000001, "r": 475.6, "b": 631.809, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 238, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 458.165, "r_y0": 631.809, "r_x1": 475.6, "r_y1": 631.809, "r_x2": 475.6, "r_y2": 623.2570000000001, "r_x3": 458.165, "r_y3": 623.2570000000001, "coord_origin": "TOPLEFT"}, "text": "85.4", "orig": "85.4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 123, "label": "text", "bbox": {"l": 497.03, "t": 623.2570000000001, "r": 514.464, "b": 631.809, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 239, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 497.03, "r_y0": 631.809, "r_x1": 514.464, "r_y1": 631.809, "r_x2": 514.464, "r_y2": 623.2570000000001, "r_x3": 497.03, "r_y3": 623.2570000000001, "coord_origin": "TOPLEFT"}, "text": "88.3", "orig": "88.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 124, "label": "text", "bbox": {"l": 345.483, "t": 635.212, "r": 396.551, "b": 643.764, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 240, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 345.483, "r_y0": 643.764, "r_x1": 396.551, "r_y1": 643.764, "r_x2": 396.551, "r_y2": 635.212, "r_x3": 345.483, "r_y3": 635.212, "coord_origin": "TOPLEFT"}, "text": "TableFormer", "orig": "TableFormer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 125, "label": "text", "bbox": {"l": 413.906, "t": 635.212, "r": 431.341, "b": 643.764, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 241, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 413.906, "r_y0": 643.764, "r_x1": 431.341, "r_y1": 643.764, "r_x2": 431.341, "r_y2": 635.212, "r_x3": 413.906, "r_y3": 635.212, "coord_origin": "TOPLEFT"}, "text": "95.4", "orig": "95.4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 126, "label": "text", "bbox": {"l": 458.17, "t": 635.212, "r": 475.605, "b": 643.764, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 242, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 458.17, "r_y0": 643.764, "r_x1": 475.605, "r_y1": 643.764, "r_x2": 475.605, "r_y2": 635.212, "r_x3": 458.17, "r_y3": 635.212, "coord_origin": "TOPLEFT"}, "text": "90.1", "orig": "90.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 127, "label": "text", "bbox": {"l": 497.034, "t": 634.8240000000001, "r": 514.469, "b": 643.78, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 243, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 497.034, "r_y0": 643.78, "r_x1": 514.469, "r_y1": 643.78, "r_x2": 514.469, "r_y2": 634.8240000000001, "r_x3": 497.034, "r_y3": 634.8240000000001, "coord_origin": "TOPLEFT"}, "text": "93.6", "orig": "93.6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}]}, "text": null, "otsl_seq": ["fcel", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl"], "num_rows": 7, "num_cols": 4, "table_cells": [{"bbox": {"l": 358.011, "t": 552.502, "r": 384.023, "b": 561.054, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Model", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 448.695, "t": 546.524, "r": 485.079, "b": 567.031, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "TEDS Complex", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 408.506, "t": 558.479, "r": 436.74, "b": 567.031, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "Simple", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 499.385, "t": 558.479, "r": 512.117, "b": 567.031, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "All", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 357.682, "t": 575.436, "r": 384.352, "b": 583.988, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Tabula", "column_header": false, "row_header": true, "row_section": false}, {"bbox": {"l": 413.901, "t": 575.436, "r": 431.336, "b": 583.988, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "78.0", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 458.165, "t": 575.436, "r": 475.599, "b": 583.988, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "57.8", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 497.029, "t": 575.436, "r": 514.463, "b": 583.988, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "67.9", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 350.723, "t": 587.391, "r": 391.311, "b": 595.943, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Traprange", "column_header": false, "row_header": true, "row_section": false}, {"bbox": {"l": 413.906, "t": 587.391, "r": 431.34, "b": 595.943, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "60.8", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 458.17, "t": 587.391, "r": 475.604, "b": 595.943, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "49.9", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 497.034, "t": 587.391, "r": 514.468, "b": 595.943, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "55.4", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 354.136, "t": 599.347, "r": 387.899, "b": 607.899, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Camelot", "column_header": false, "row_header": true, "row_section": false}, {"bbox": {"l": 413.902, "t": 599.347, "r": 431.336, "b": 607.899, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "80.0", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 458.165, "t": 599.347, "r": 475.6, "b": 607.899, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "66.0", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 497.03, "t": 599.347, "r": 514.464, "b": 607.899, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "73.0", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 346.559, "t": 611.302, "r": 395.475, "b": 619.854, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Acrobat Pro", "column_header": false, "row_header": true, "row_section": false}, {"bbox": {"l": 413.906, "t": 611.302, "r": 431.341, "b": 619.854, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "68.9", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 458.17, "t": 611.302, "r": 475.605, "b": 619.854, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "61.8", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 497.034, "t": 611.302, "r": 514.469, "b": 619.854, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "65.3", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 360.781, "t": 623.2570000000001, "r": 381.254, "b": 631.809, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "EDD", "column_header": false, "row_header": true, "row_section": false}, {"bbox": {"l": 413.902, "t": 623.2570000000001, "r": 431.336, "b": 631.809, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "91.2", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 458.165, "t": 623.2570000000001, "r": 475.6, "b": 631.809, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "85.4", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 497.03, "t": 623.2570000000001, "r": 514.464, "b": 631.809, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "88.3", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 345.483, "t": 635.212, "r": 396.551, "b": 643.764, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "TableFormer", "column_header": false, "row_header": true, "row_section": false}, {"bbox": {"l": 413.906, "t": 635.212, "r": 431.341, "b": 643.764, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "95.4", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 458.17, "t": 635.212, "r": 475.605, "b": 643.764, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "90.1", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 497.034, "t": 634.8240000000001, "r": 514.469, "b": 643.78, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "93.6", "column_header": false, "row_header": false, "row_section": false}]}, {"label": "caption", "id": 11, "page_no": 6, "cluster": {"id": 11, "label": "caption", "bbox": {"l": 308.862, "t": 657.13, "r": 545.115, "b": 689.592, "coord_origin": "TOPLEFT"}, "confidence": 0.9541404247283936, "cells": [{"index": 244, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 665.682, "r_x1": 341.739, "r_y1": 665.682, "r_x2": 341.739, "r_y2": 657.13, "r_x3": 308.862, "r_y3": 657.13, "coord_origin": "TOPLEFT"}, "text": "Table 4:", "orig": "Table 4:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 245, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 349.559, "r_y0": 665.682, "r_x1": 545.115, "r_y1": 665.682, "r_x2": 545.115, "r_y2": 657.13, "r_x3": 349.559, "r_y3": 657.13, "coord_origin": "TOPLEFT"}, "text": "Results of structure with content retrieved using", "orig": "Results of structure with content retrieved using", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 246, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 677.637, "r_x1": 425.763, "r_y1": 677.637, "r_x2": 425.763, "r_y2": 669.085, "r_x3": 308.862, "r_y3": 669.085, "coord_origin": "TOPLEFT"}, "text": "cell detection on PubTabNet.", "orig": "cell detection on PubTabNet.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 247, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 430.336, "r_y0": 677.637, "r_x1": 545.115, "r_y1": 677.637, "r_x2": 545.115, "r_y2": 669.085, "r_x3": 430.336, "r_y3": 669.085, "coord_origin": "TOPLEFT"}, "text": "In all cases the input is PDF", "orig": "In all cases the input is PDF", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 248, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 689.592, "r_x1": 435.038, "r_y1": 689.592, "r_x2": 435.038, "r_y2": 681.04, "r_x3": 308.862, "r_y3": 681.04, "coord_origin": "TOPLEFT"}, "text": "documents with cropped tables.", "orig": "documents with cropped tables.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Table 4: Results of structure with content retrieved using cell detection on PubTabNet. In all cases the input is PDF documents with cropped tables."}], "headers": [{"label": "page_footer", "id": 14, "page_no": 6, "cluster": {"id": 14, "label": "page_footer", "bbox": {"l": 295.121, "t": 734.402, "r": 300.102, "b": 742.954, "coord_origin": "TOPLEFT"}, "confidence": 0.8787972331047058, "cells": [{"index": 249, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 295.121, "r_y0": 742.954, "r_x1": 300.102, "r_y1": 742.954, "r_x2": 300.102, "r_y2": 734.402, "r_x3": 295.121, "r_y3": 734.402, "coord_origin": "TOPLEFT"}, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "7"}]}}, {"page_no": 7, "size": {"width": 612.0, "height": 792.0}, "cells": [{"index": 0, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 53.812, "r_y0": 216.02300000000002, "r_x1": 385.934, "r_y1": 216.02300000000002, "r_x2": 385.934, "r_y2": 208.54100000000005, "r_x3": 53.812, "r_y3": 208.54100000000005, "coord_origin": "TOPLEFT"}, "text": "b. Structure predicted by TableFormer, with superimposed matched PDF cell text:", "orig": "b. Structure predicted by TableFormer, with superimposed matched PDF cell text:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 53.812, "r_y0": 102.07100000000003, "r_x1": 284.346, "r_y1": 102.07100000000003, "r_x2": 284.346, "r_y2": 94.58900000000006, "r_x3": 53.812, "r_y3": 94.58900000000006, "coord_origin": "TOPLEFT"}, "text": "Japanese language (previously unseen by TableFormer):", "orig": "Japanese language (previously unseen by TableFormer):", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 304.831, "r_y0": 102.07100000000003, "r_x1": 431.091, "r_y1": 102.07100000000003, "r_x2": 431.091, "r_y2": 94.58900000000006, "r_x3": 304.831, "r_y3": 94.58900000000006, "coord_origin": "TOPLEFT"}, "text": "Example table from FinTabNet:", "orig": "Example table from FinTabNet:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 53.286, "r_y0": 86.47699999999998, "r_x1": 499.556, "r_y1": 86.47699999999998, "r_x2": 499.556, "r_y2": 78.995, "r_x3": 53.286, "r_y3": 78.995, "coord_origin": "TOPLEFT"}, "text": "a. Red - PDF cells, Green - predicted bounding boxes, Blue - post-processed predictions matched to PDF cells", "orig": "a. Red - PDF cells, Green - predicted bounding boxes, Blue - post-processed predictions matched to PDF cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 209.933, "r_y0": 226.00400000000002, "r_x1": 223.873, "r_y1": 226.00400000000002, "r_x2": 223.873, "r_y2": 221.35799999999995, "r_x3": 209.933, "r_y3": 221.35799999999995, "coord_origin": "TOPLEFT"}, "text": "\u8ad6\u6587\u30d5\u30a1\u30a4\u30eb", "orig": "\u8ad6\u6587\u30d5\u30a1\u30a4\u30eb", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 263.765, "r_y0": 226.00400000000002, "r_x1": 273.058, "r_y1": 226.00400000000002, "r_x2": 273.058, "r_y2": 221.35799999999995, "r_x3": 263.765, "r_y3": 221.35799999999995, "coord_origin": "TOPLEFT"}, "text": "\u53c2\u8003\u6587\u732e", "orig": "\u53c2\u8003\u6587\u732e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 110.25, "r_y0": 233.49, "r_x1": 114.896, "r_y1": 233.49, "r_x2": 114.896, "r_y2": 228.84400000000005, "r_x3": 110.25, "r_y3": 228.84400000000005, "coord_origin": "TOPLEFT"}, "text": "\u51fa\u5178", "orig": "\u51fa\u5178", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 175.366, "r_y0": 233.49, "r_x1": 186.983, "r_y1": 233.49, "r_x2": 186.983, "r_y2": 228.84400000000005, "r_x3": 175.366, "r_y3": 228.84400000000005, "coord_origin": "TOPLEFT"}, "text": "\u30d5\u30a1\u30a4\u30eb\u6570", "orig": "\u30d5\u30a1\u30a4\u30eb\u6570", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 195.314, "r_y0": 233.49, "r_x1": 199.961, "r_y1": 233.49, "r_x2": 199.961, "r_y2": 228.84400000000005, "r_x3": 195.314, "r_y3": 228.84400000000005, "coord_origin": "TOPLEFT"}, "text": "\u82f1\u8a9e", "orig": "\u82f1\u8a9e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 229.198, "r_y0": 233.49, "r_x1": 236.168, "r_y1": 233.49, "r_x2": 236.168, "r_y2": 228.84400000000005, "r_x3": 229.198, "r_y3": 228.84400000000005, "coord_origin": "TOPLEFT"}, "text": "\u65e5\u672c\u8a9e", "orig": "\u65e5\u672c\u8a9e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 256.114, "r_y0": 233.49, "r_x1": 260.761, "r_y1": 233.49, "r_x2": 260.761, "r_y2": 228.84400000000005, "r_x3": 256.114, "r_y3": 228.84400000000005, "coord_origin": "TOPLEFT"}, "text": "\u82f1\u8a9e", "orig": "\u82f1\u8a9e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 278.384, "r_y0": 233.49, "r_x1": 285.354, "r_y1": 233.49, "r_x2": 285.354, "r_y2": 228.84400000000005, "r_x3": 278.384, "r_y3": 228.84400000000005, "coord_origin": "TOPLEFT"}, "text": "\u65e5\u672c\u8a9e", "orig": "\u65e5\u672c\u8a9e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 55.531, "r_y0": 240.76800000000003, "r_x1": 162.713, "r_y1": 240.76800000000003, "r_x2": 162.713, "r_y2": 236.48199999999997, "r_x3": 55.531, "r_y3": 236.48199999999997, "coord_origin": "TOPLEFT"}, "text": "Association for Computational Linguistics(ACL2003)", "orig": "Association for Computational Linguistics(ACL2003)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 184.397, "r_y0": 240.76800000000003, "r_x1": 189.565, "r_y1": 240.76800000000003, "r_x2": 189.565, "r_y2": 236.48199999999997, "r_x3": 184.397, "r_y3": 236.48199999999997, "coord_origin": "TOPLEFT"}, "text": "65", "orig": "65", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 208.99, "r_y0": 240.76800000000003, "r_x1": 214.158, "r_y1": 240.76800000000003, "r_x2": 214.158, "r_y2": 236.48199999999997, "r_x3": 208.99, "r_y3": 236.48199999999997, "coord_origin": "TOPLEFT"}, "text": "65", "orig": "65", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 234.875, "r_y0": 240.76800000000003, "r_x1": 237.458, "r_y1": 240.76800000000003, "r_x2": 237.458, "r_y2": 236.48199999999997, "r_x3": 234.875, "r_y3": 236.48199999999997, "coord_origin": "TOPLEFT"}, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 256.884, "r_y0": 240.76800000000003, "r_x1": 264.636, "r_y1": 240.76800000000003, "r_x2": 264.636, "r_y2": 236.48199999999997, "r_x3": 256.884, "r_y3": 236.48199999999997, "coord_origin": "TOPLEFT"}, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 284.061, "r_y0": 240.76800000000003, "r_x1": 286.644, "r_y1": 240.76800000000003, "r_x2": 286.644, "r_y2": 236.48199999999997, "r_x3": 284.061, "r_y3": 236.48199999999997, "coord_origin": "TOPLEFT"}, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 55.531, "r_y0": 246.962, "r_x1": 139.722, "r_y1": 246.962, "r_x2": 139.722, "r_y2": 242.67600000000004, "r_x3": 55.531, "r_y3": 242.67600000000004, "coord_origin": "TOPLEFT"}, "text": "Computational Linguistics(COLING2002)", "orig": "Computational Linguistics(COLING2002)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 19, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.105, "r_y0": 246.962, "r_x1": 190.857, "r_y1": 246.962, "r_x2": 190.857, "r_y2": 242.67600000000004, "r_x3": 183.105, "r_y3": 242.67600000000004, "coord_origin": "TOPLEFT"}, "text": "140", "orig": "140", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 20, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 207.698, "r_y0": 246.962, "r_x1": 215.45, "r_y1": 246.962, "r_x2": 215.45, "r_y2": 242.67600000000004, "r_x3": 207.698, "r_y3": 242.67600000000004, "coord_origin": "TOPLEFT"}, "text": "140", "orig": "140", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 21, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 234.875, "r_y0": 246.962, "r_x1": 237.458, "r_y1": 246.962, "r_x2": 237.458, "r_y2": 242.67600000000004, "r_x3": 234.875, "r_y3": 242.67600000000004, "coord_origin": "TOPLEFT"}, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 22, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 256.884, "r_y0": 246.962, "r_x1": 264.636, "r_y1": 246.962, "r_x2": 264.636, "r_y2": 242.67600000000004, "r_x3": 256.884, "r_y3": 242.67600000000004, "coord_origin": "TOPLEFT"}, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 23, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 284.061, "r_y0": 246.962, "r_x1": 286.644, "r_y1": 246.962, "r_x2": 286.644, "r_y2": 242.67600000000004, "r_x3": 284.061, "r_y3": 242.67600000000004, "coord_origin": "TOPLEFT"}, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 24, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 55.531, "r_y0": 253.62199999999996, "r_x1": 74.118, "r_y1": 253.62199999999996, "r_x2": 74.118, "r_y2": 248.976, "r_x3": 55.531, "r_y3": 248.976, "coord_origin": "TOPLEFT"}, "text": "\u96fb\u6c17\u60c5\u5831\u901a\u4fe1\u5b66\u4f1a", "orig": "\u96fb\u6c17\u60c5\u5831\u901a\u4fe1\u5b66\u4f1a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 25, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 92.698, "r_y0": 253.93100000000004, "r_x1": 103.034, "r_y1": 253.93100000000004, "r_x2": 103.034, "r_y2": 249.64499999999998, "r_x3": 92.698, "r_y3": 249.64499999999998, "coord_origin": "TOPLEFT"}, "text": "2003", "orig": "2003", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 26, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 103.034, "r_y0": 253.62199999999996, "r_x1": 114.651, "r_y1": 253.62199999999996, "r_x2": 114.651, "r_y2": 248.976, "r_x3": 103.034, "r_y3": 248.976, "coord_origin": "TOPLEFT"}, "text": "\u5e74\u7dcf\u5408\u5927\u4f1a", "orig": "\u5e74\u7dcf\u5408\u5927\u4f1a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 27, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.105, "r_y0": 253.15700000000004, "r_x1": 190.857, "r_y1": 253.15700000000004, "r_x2": 190.857, "r_y2": 248.87099999999998, "r_x3": 183.105, "r_y3": 248.87099999999998, "coord_origin": "TOPLEFT"}, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 28, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 210.282, "r_y0": 253.15700000000004, "r_x1": 212.865, "r_y1": 253.15700000000004, "r_x2": 212.865, "r_y2": 248.87099999999998, "r_x3": 210.282, "r_y3": 248.87099999999998, "coord_origin": "TOPLEFT"}, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 29, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 232.292, "r_y0": 253.15700000000004, "r_x1": 240.043, "r_y1": 253.15700000000004, "r_x2": 240.043, "r_y2": 248.87099999999998, "r_x3": 232.292, "r_y3": 248.87099999999998, "coord_origin": "TOPLEFT"}, "text": "142", "orig": "142", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 30, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 256.884, "r_y0": 253.15700000000004, "r_x1": 264.636, "r_y1": 253.15700000000004, "r_x2": 264.636, "r_y2": 248.87099999999998, "r_x3": 256.884, "r_y3": 248.87099999999998, "coord_origin": "TOPLEFT"}, "text": "223", "orig": "223", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 281.477, "r_y0": 253.15700000000004, "r_x1": 289.229, "r_y1": 253.15700000000004, "r_x2": 289.229, "r_y2": 248.87099999999998, "r_x3": 281.477, "r_y3": 248.87099999999998, "coord_origin": "TOPLEFT"}, "text": "147", "orig": "147", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 55.531, "r_y0": 261.10699999999997, "r_x1": 71.794, "r_y1": 261.10699999999997, "r_x2": 71.794, "r_y2": 256.461, "r_x3": 55.531, "r_y3": 256.461, "coord_origin": "TOPLEFT"}, "text": "\u60c5\u5831\u51e6\u7406\u5b66\u4f1a\u7b2c", "orig": "\u60c5\u5831\u51e6\u7406\u5b66\u4f1a\u7b2c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 88.053, "r_y0": 261.41600000000005, "r_x1": 93.22, "r_y1": 261.41600000000005, "r_x2": 93.22, "r_y2": 257.13, "r_x3": 88.053, "r_y3": 257.13, "coord_origin": "TOPLEFT"}, "text": "65", "orig": "65", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 93.22, "r_y0": 261.10699999999997, "r_x1": 104.837, "r_y1": 261.10699999999997, "r_x2": 104.837, "r_y2": 256.461, "r_x3": 93.22, "r_y3": 256.461, "coord_origin": "TOPLEFT"}, "text": "\u56de\u5168\u56fd\u5927\u4f1a", "orig": "\u56de\u5168\u56fd\u5927\u4f1a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 116.451, "r_y0": 261.41600000000005, "r_x1": 129.882, "r_y1": 261.41600000000005, "r_x2": 129.882, "r_y2": 257.13, "r_x3": 116.451, "r_y3": 257.13, "coord_origin": "TOPLEFT"}, "text": "(2003)", "orig": "(2003)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.105, "r_y0": 260.64200000000005, "r_x1": 190.857, "r_y1": 260.64200000000005, "r_x2": 190.857, "r_y2": 256.356, "r_x3": 183.105, "r_y3": 256.356, "coord_origin": "TOPLEFT"}, "text": "177", "orig": "177", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 210.282, "r_y0": 260.64200000000005, "r_x1": 212.865, "r_y1": 260.64200000000005, "r_x2": 212.865, "r_y2": 256.356, "r_x3": 210.282, "r_y3": 256.356, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 232.292, "r_y0": 260.64200000000005, "r_x1": 240.043, "r_y1": 260.64200000000005, "r_x2": 240.043, "r_y2": 256.356, "r_x3": 232.292, "r_y3": 256.356, "coord_origin": "TOPLEFT"}, "text": "176", "orig": "176", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 256.884, "r_y0": 260.64200000000005, "r_x1": 264.636, "r_y1": 260.64200000000005, "r_x2": 264.636, "r_y2": 256.356, "r_x3": 256.884, "r_y3": 256.356, "coord_origin": "TOPLEFT"}, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 281.477, "r_y0": 260.64200000000005, "r_x1": 289.229, "r_y1": 260.64200000000005, "r_x2": 289.229, "r_y2": 256.356, "r_x3": 281.477, "r_y3": 256.356, "coord_origin": "TOPLEFT"}, "text": "236", "orig": "236", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 55.531, "r_y0": 268.33399999999995, "r_x1": 57.854, "r_y1": 268.33399999999995, "r_x2": 57.854, "r_y2": 263.688, "r_x3": 55.531, "r_y3": 263.688, "coord_origin": "TOPLEFT"}, "text": "\u7b2c", "orig": "\u7b2c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 60.177, "r_y0": 268.644, "r_x1": 65.344, "r_y1": 268.644, "r_x2": 65.344, "r_y2": 264.35699999999997, "r_x3": 60.177, "r_y3": 264.35699999999997, "coord_origin": "TOPLEFT"}, "text": "17", "orig": "17", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 65.344, "r_y0": 268.33399999999995, "r_x1": 90.902, "r_y1": 268.33399999999995, "r_x2": 90.902, "r_y2": 263.688, "r_x3": 65.344, "r_y3": 263.688, "coord_origin": "TOPLEFT"}, "text": "\u56de\u4eba\u5de5\u77e5\u80fd\u5b66\u4f1a\u5168\u56fd\u5927\u4f1a", "orig": "\u56de\u4eba\u5de5\u77e5\u80fd\u5b66\u4f1a\u5168\u56fd\u5927\u4f1a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 116.451, "r_y0": 268.644, "r_x1": 129.882, "r_y1": 268.644, "r_x2": 129.882, "r_y2": 264.35699999999997, "r_x3": 116.451, "r_y3": 264.35699999999997, "coord_origin": "TOPLEFT"}, "text": "(2003)", "orig": "(2003)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.105, "r_y0": 267.869, "r_x1": 190.857, "r_y1": 267.869, "r_x2": 190.857, "r_y2": 263.58299999999997, "r_x3": 183.105, "r_y3": 263.58299999999997, "coord_origin": "TOPLEFT"}, "text": "208", "orig": "208", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 210.282, "r_y0": 267.869, "r_x1": 212.865, "r_y1": 267.869, "r_x2": 212.865, "r_y2": 263.58299999999997, "r_x3": 210.282, "r_y3": 263.58299999999997, "coord_origin": "TOPLEFT"}, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 232.292, "r_y0": 267.869, "r_x1": 240.043, "r_y1": 267.869, "r_x2": 240.043, "r_y2": 263.58299999999997, "r_x3": 232.292, "r_y3": 263.58299999999997, "coord_origin": "TOPLEFT"}, "text": "203", "orig": "203", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 48, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 256.884, "r_y0": 267.869, "r_x1": 264.636, "r_y1": 267.869, "r_x2": 264.636, "r_y2": 263.58299999999997, "r_x3": 256.884, "r_y3": 263.58299999999997, "coord_origin": "TOPLEFT"}, "text": "152", "orig": "152", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 49, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 281.477, "r_y0": 267.869, "r_x1": 289.229, "r_y1": 267.869, "r_x2": 289.229, "r_y2": 263.58299999999997, "r_x3": 281.477, "r_y3": 263.58299999999997, "coord_origin": "TOPLEFT"}, "text": "244", "orig": "244", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 50, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 55.531, "r_y0": 275.562, "r_x1": 78.765, "r_y1": 275.562, "r_x2": 78.765, "r_y2": 270.91600000000005, "r_x3": 55.531, "r_y3": 270.91600000000005, "coord_origin": "TOPLEFT"}, "text": "\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u7814\u7a76\u4f1a\u7b2c", "orig": "\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u7814\u7a76\u4f1a\u7b2c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 51, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 101.99, "r_y0": 275.871, "r_x1": 109.742, "r_y1": 275.871, "r_x2": 109.742, "r_y2": 271.58500000000004, "r_x3": 101.99, "r_y3": 271.58500000000004, "coord_origin": "TOPLEFT"}, "text": "146", "orig": "146", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 52, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 109.742, "r_y0": 275.562, "r_x1": 112.065, "r_y1": 275.562, "r_x2": 112.065, "r_y2": 270.91600000000005, "r_x3": 109.742, "r_y3": 270.91600000000005, "coord_origin": "TOPLEFT"}, "text": "\u301c", "orig": "\u301c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 53, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 114.388, "r_y0": 275.871, "r_x1": 122.139, "r_y1": 275.871, "r_x2": 122.139, "r_y2": 271.58500000000004, "r_x3": 114.388, "r_y3": 271.58500000000004, "coord_origin": "TOPLEFT"}, "text": "155", "orig": "155", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 54, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 122.14, "r_y0": 275.562, "r_x1": 124.463, "r_y1": 275.562, "r_x2": 124.463, "r_y2": 270.91600000000005, "r_x3": 122.14, "r_y3": 270.91600000000005, "coord_origin": "TOPLEFT"}, "text": "\u56de", "orig": "\u56de", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 55, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 184.397, "r_y0": 275.096, "r_x1": 189.565, "r_y1": 275.096, "r_x2": 189.565, "r_y2": 270.80999999999995, "r_x3": 184.397, "r_y3": 270.80999999999995, "coord_origin": "TOPLEFT"}, "text": "98", "orig": "98", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 56, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 210.282, "r_y0": 275.096, "r_x1": 212.865, "r_y1": 275.096, "r_x2": 212.865, "r_y2": 270.80999999999995, "r_x3": 210.282, "r_y3": 270.80999999999995, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 57, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 233.583, "r_y0": 275.096, "r_x1": 238.751, "r_y1": 275.096, "r_x2": 238.751, "r_y2": 270.80999999999995, "r_x3": 233.583, "r_y3": 270.80999999999995, "coord_origin": "TOPLEFT"}, "text": "96", "orig": "96", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 58, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 256.884, "r_y0": 275.096, "r_x1": 264.636, "r_y1": 275.096, "r_x2": 264.636, "r_y2": 270.80999999999995, "r_x3": 256.884, "r_y3": 270.80999999999995, "coord_origin": "TOPLEFT"}, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 59, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 281.477, "r_y0": 275.096, "r_x1": 289.229, "r_y1": 275.096, "r_x2": 289.229, "r_y2": 270.80999999999995, "r_x3": 281.477, "r_y3": 270.80999999999995, "coord_origin": "TOPLEFT"}, "text": "232", "orig": "232", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 60, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 55.531, "r_y0": 283.356, "r_x1": 68.686, "r_y1": 283.356, "r_x2": 68.686, "r_y2": 279.07000000000005, "r_x3": 55.531, "r_y3": 279.07000000000005, "coord_origin": "TOPLEFT"}, "text": "WWW", "orig": "WWW", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 61, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 68.686, "r_y0": 283.047, "r_x1": 87.273, "r_y1": 283.047, "r_x2": 87.273, "r_y2": 278.40099999999995, "r_x3": 68.686, "r_y3": 278.40099999999995, "coord_origin": "TOPLEFT"}, "text": "\u304b\u3089\u53ce\u96c6\u3057\u305f\u8ad6\u6587", "orig": "\u304b\u3089\u53ce\u96c6\u3057\u305f\u8ad6\u6587", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 62, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.105, "r_y0": 282.323, "r_x1": 190.857, "r_y1": 282.323, "r_x2": 190.857, "r_y2": 278.03700000000003, "r_x3": 183.105, "r_y3": 278.03700000000003, "coord_origin": "TOPLEFT"}, "text": "107", "orig": "107", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 63, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 208.99, "r_y0": 282.323, "r_x1": 214.158, "r_y1": 282.323, "r_x2": 214.158, "r_y2": 278.03700000000003, "r_x3": 208.99, "r_y3": 278.03700000000003, "coord_origin": "TOPLEFT"}, "text": "73", "orig": "73", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 64, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 233.583, "r_y0": 282.323, "r_x1": 238.751, "r_y1": 282.323, "r_x2": 238.751, "r_y2": 278.03700000000003, "r_x3": 233.583, "r_y3": 278.03700000000003, "coord_origin": "TOPLEFT"}, "text": "34", "orig": "34", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 65, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 256.884, "r_y0": 282.323, "r_x1": 264.636, "r_y1": 282.323, "r_x2": 264.636, "r_y2": 278.03700000000003, "r_x3": 256.884, "r_y3": 278.03700000000003, "coord_origin": "TOPLEFT"}, "text": "147", "orig": "147", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 66, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 282.769, "r_y0": 282.323, "r_x1": 287.937, "r_y1": 282.323, "r_x2": 287.937, "r_y2": 278.03700000000003, "r_x3": 282.769, "r_y3": 278.03700000000003, "coord_origin": "TOPLEFT"}, "text": "96", "orig": "96", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 67, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 169.615, "r_y0": 290.274, "r_x1": 171.938, "r_y1": 290.274, "r_x2": 171.938, "r_y2": 285.628, "r_x3": 169.615, "r_y3": 285.628, "coord_origin": "TOPLEFT"}, "text": "\u8a08", "orig": "\u8a08", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 68, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.105, "r_y0": 289.809, "r_x1": 190.857, "r_y1": 289.809, "r_x2": 190.857, "r_y2": 285.522, "r_x3": 183.105, "r_y3": 285.522, "coord_origin": "TOPLEFT"}, "text": "945", "orig": "945", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 69, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 207.698, "r_y0": 289.809, "r_x1": 215.45, "r_y1": 289.809, "r_x2": 215.45, "r_y2": 285.522, "r_x3": 207.698, "r_y3": 285.522, "coord_origin": "TOPLEFT"}, "text": "294", "orig": "294", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 70, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 232.292, "r_y0": 289.809, "r_x1": 240.043, "r_y1": 289.809, "r_x2": 240.043, "r_y2": 285.522, "r_x3": 232.292, "r_y3": 285.522, "coord_origin": "TOPLEFT"}, "text": "651", "orig": "651", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 71, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 255.765, "r_y0": 289.809, "r_x1": 265.752, "r_y1": 289.809, "r_x2": 265.752, "r_y2": 285.522, "r_x3": 255.765, "r_y3": 285.522, "coord_origin": "TOPLEFT"}, "text": "1122", "orig": "1122", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 72, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 281.477, "r_y0": 289.809, "r_x1": 289.229, "r_y1": 289.809, "r_x2": 289.229, "r_y2": 285.522, "r_x3": 281.477, "r_y3": 285.522, "coord_origin": "TOPLEFT"}, "text": "955", "orig": "955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 73, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 380.427, "r_y0": 298.536, "r_x1": 549.422, "r_y1": 298.536, "r_x2": 549.422, "r_y2": 292.551, "r_x3": 380.427, "r_y3": 292.551, "coord_origin": "TOPLEFT"}, "text": "Text is aligned to match original for ease of viewing", "orig": "Text is aligned to match original for ease of viewing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 74, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 459.049, "r_y0": 226.67100000000005, "r_x1": 542.0, "r_y1": 226.67100000000005, "r_x2": 542.0, "r_y2": 221.68899999999996, "r_x3": 459.049, "r_y3": 221.68899999999996, "coord_origin": "TOPLEFT"}, "text": "Weighted Average Grant Date Fair", "orig": "Weighted Average Grant Date Fair", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 75, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 493.822, "r_y0": 232.88099999999997, "r_x1": 507.226, "r_y1": 232.88099999999997, "r_x2": 507.226, "r_y2": 227.899, "r_x3": 493.822, "r_y3": 227.899, "coord_origin": "TOPLEFT"}, "text": "Value", "orig": "Value", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 76, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 393.244, "r_y0": 241.79399999999998, "r_x1": 407.346, "r_y1": 241.79399999999998, "r_x2": 407.346, "r_y2": 236.812, "r_x3": 393.244, "r_y3": 236.812, "coord_origin": "TOPLEFT"}, "text": "RSUs", "orig": "RSUs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 77, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 392.097, "r_y0": 226.62099999999998, "r_x1": 438.015, "r_y1": 226.62099999999998, "r_x2": 438.015, "r_y2": 221.639, "r_x3": 392.097, "r_y3": 221.639, "coord_origin": "TOPLEFT"}, "text": "Shares (in millions)", "orig": "Shares (in millions)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 78, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 427.183, "r_y0": 241.79399999999998, "r_x1": 440.988, "r_y1": 241.79399999999998, "r_x2": 440.988, "r_y2": 236.812, "r_x3": 427.183, "r_y3": 236.812, "coord_origin": "TOPLEFT"}, "text": "PSUs", "orig": "PSUs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 79, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 468.383, "r_y0": 241.79399999999998, "r_x1": 482.485, "r_y1": 241.79399999999998, "r_x2": 482.485, "r_y2": 236.812, "r_x3": 468.383, "r_y3": 236.812, "coord_origin": "TOPLEFT"}, "text": "RSUs", "orig": "RSUs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 80, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 516.926, "r_y0": 241.79399999999998, "r_x1": 530.73, "r_y1": 241.79399999999998, "r_x2": 530.73, "r_y2": 236.812, "r_x3": 516.926, "r_y3": 236.812, "coord_origin": "TOPLEFT"}, "text": "PSUs", "orig": "PSUs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 81, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 306.115, "r_y0": 249.65700000000004, "r_x1": 364.656, "r_y1": 249.65700000000004, "r_x2": 364.656, "r_y2": 244.67600000000004, "r_x3": 306.115, "r_y3": 244.67600000000004, "coord_origin": "TOPLEFT"}, "text": "Nonvested on January 1", "orig": "Nonvested on January 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 82, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 396.247, "r_y0": 249.96000000000004, "r_x1": 403.755, "r_y1": 249.96000000000004, "r_x2": 403.755, "r_y2": 244.97799999999995, "r_x3": 396.247, "r_y3": 244.97799999999995, "coord_origin": "TOPLEFT"}, "text": "1.1", "orig": "1.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 83, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 429.818, "r_y0": 249.96000000000004, "r_x1": 437.327, "r_y1": 249.96000000000004, "r_x2": 437.327, "r_y2": 244.97799999999995, "r_x3": 429.818, "r_y3": 244.97799999999995, "coord_origin": "TOPLEFT"}, "text": "0.3", "orig": "0.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 84, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 465.529, "r_y0": 249.96000000000004, "r_x1": 483.55, "r_y1": 249.96000000000004, "r_x2": 483.55, "r_y2": 244.97799999999995, "r_x3": 465.529, "r_y3": 244.97799999999995, "coord_origin": "TOPLEFT"}, "text": "90.10 $", "orig": "90.10 $", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 85, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 513.448, "r_y0": 249.96000000000004, "r_x1": 531.47, "r_y1": 249.96000000000004, "r_x2": 531.47, "r_y2": 244.97799999999995, "r_x3": 513.448, "r_y3": 244.97799999999995, "coord_origin": "TOPLEFT"}, "text": "$ 91.19", "orig": "$ 91.19", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 86, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 306.115, "r_y0": 258.731, "r_x1": 325.627, "r_y1": 258.731, "r_x2": 325.627, "r_y2": 253.74900000000002, "r_x3": 306.115, "r_y3": 253.74900000000002, "coord_origin": "TOPLEFT"}, "text": "Granted", "orig": "Granted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 87, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 396.247, "r_y0": 258.731, "r_x1": 403.755, "r_y1": 258.731, "r_x2": 403.755, "r_y2": 253.74900000000002, "r_x3": 396.247, "r_y3": 253.74900000000002, "coord_origin": "TOPLEFT"}, "text": "0.5", "orig": "0.5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 88, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 429.818, "r_y0": 258.731, "r_x1": 437.327, "r_y1": 258.731, "r_x2": 437.327, "r_y2": 253.74900000000002, "r_x3": 429.818, "r_y3": 253.74900000000002, "coord_origin": "TOPLEFT"}, "text": "0.1", "orig": "0.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 89, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 466.436, "r_y0": 258.731, "r_x1": 482.548, "r_y1": 258.731, "r_x2": 482.548, "r_y2": 253.74900000000002, "r_x3": 466.436, "r_y3": 253.74900000000002, "coord_origin": "TOPLEFT"}, "text": "117.44", "orig": "117.44", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 90, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 514.291, "r_y0": 258.731, "r_x1": 530.81, "r_y1": 258.731, "r_x2": 530.81, "r_y2": 253.74900000000002, "r_x3": 514.291, "r_y3": 253.74900000000002, "coord_origin": "TOPLEFT"}, "text": "122.41", "orig": "122.41", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 91, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 306.115, "r_y0": 266.595, "r_x1": 322.629, "r_y1": 266.595, "r_x2": 322.629, "r_y2": 261.61300000000006, "r_x3": 306.115, "r_y3": 261.61300000000006, "coord_origin": "TOPLEFT"}, "text": "Vested", "orig": "Vested", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 92, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.432, "r_y0": 266.595, "r_x1": 405.536, "r_y1": 266.595, "r_x2": 405.536, "r_y2": 261.61300000000006, "r_x3": 394.432, "r_y3": 261.61300000000006, "coord_origin": "TOPLEFT"}, "text": "(0.5)", "orig": "(0.5)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 93, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 427.702, "r_y0": 266.595, "r_x1": 438.806, "r_y1": 266.595, "r_x2": 438.806, "r_y2": 261.61300000000006, "r_x3": 427.702, "r_y3": 261.61300000000006, "coord_origin": "TOPLEFT"}, "text": "(0.1)", "orig": "(0.1)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 94, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 468.555, "r_y0": 266.595, "r_x1": 482.07, "r_y1": 266.595, "r_x2": 482.07, "r_y2": 261.61300000000006, "r_x3": 468.555, "r_y3": 261.61300000000006, "coord_origin": "TOPLEFT"}, "text": "87.08", "orig": "87.08", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 95, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 516.019, "r_y0": 266.595, "r_x1": 529.534, "r_y1": 266.595, "r_x2": 529.534, "r_y2": 261.61300000000006, "r_x3": 516.019, "r_y3": 261.61300000000006, "coord_origin": "TOPLEFT"}, "text": "81.14", "orig": "81.14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 96, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 306.115, "r_y0": 274.688, "r_x1": 356.248, "r_y1": 274.688, "r_x2": 356.248, "r_y2": 269.706, "r_x3": 306.115, "r_y3": 269.706, "coord_origin": "TOPLEFT"}, "text": "Canceled or forfeited", "orig": "Canceled or forfeited", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 97, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.432, "r_y0": 275.366, "r_x1": 405.536, "r_y1": 275.366, "r_x2": 405.536, "r_y2": 270.384, "r_x3": 394.432, "r_y3": 270.384, "coord_origin": "TOPLEFT"}, "text": "(0.1)", "orig": "(0.1)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 98, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 431.028, "r_y0": 275.366, "r_x1": 436.428, "r_y1": 275.366, "r_x2": 436.428, "r_y2": 270.384, "r_x3": 431.028, "r_y3": 270.384, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 99, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 465.831, "r_y0": 275.366, "r_x1": 482.35, "r_y1": 275.366, "r_x2": 482.35, "r_y2": 270.384, "r_x3": 465.831, "r_y3": 270.384, "coord_origin": "TOPLEFT"}, "text": "102.01", "orig": "102.01", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 100, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 516.019, "r_y0": 275.366, "r_x1": 529.534, "r_y1": 275.366, "r_x2": 529.534, "r_y2": 270.384, "r_x3": 516.019, "r_y3": 270.384, "coord_origin": "TOPLEFT"}, "text": "92.18", "orig": "92.18", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 101, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 306.115, "r_y0": 283.532, "r_x1": 373.358, "r_y1": 283.532, "r_x2": 373.358, "r_y2": 278.55100000000004, "r_x3": 306.115, "r_y3": 278.55100000000004, "coord_origin": "TOPLEFT"}, "text": "Nonvested on December 31", "orig": "Nonvested on December 31", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 102, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 396.247, "r_y0": 283.532, "r_x1": 403.755, "r_y1": 283.532, "r_x2": 403.755, "r_y2": 278.55100000000004, "r_x3": 396.247, "r_y3": 278.55100000000004, "coord_origin": "TOPLEFT"}, "text": "1.0", "orig": "1.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 103, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 429.516, "r_y0": 283.532, "r_x1": 437.025, "r_y1": 283.532, "r_x2": 437.025, "r_y2": 278.55100000000004, "r_x3": 429.516, "r_y3": 278.55100000000004, "coord_origin": "TOPLEFT"}, "text": "0.3", "orig": "0.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 104, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 463.714, "r_y0": 283.532, "r_x1": 484.74, "r_y1": 283.532, "r_x2": 484.74, "r_y2": 278.55100000000004, "r_x3": 463.714, "r_y3": 278.55100000000004, "coord_origin": "TOPLEFT"}, "text": "104.85 $", "orig": "104.85 $", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 105, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 512.995, "r_y0": 283.532, "r_x1": 534.02, "r_y1": 283.532, "r_x2": 534.02, "r_y2": 278.55100000000004, "r_x3": 512.995, "r_y3": 278.55100000000004, "coord_origin": "TOPLEFT"}, "text": "$ 104.51", "orig": "$ 104.51", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 106, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 329.698, "r_x1": 86.864, "r_y1": 329.698, "r_x2": 86.864, "r_y2": 321.146, "r_x3": 50.112, "r_y3": 321.146, "coord_origin": "TOPLEFT"}, "text": "Figure 5:", "orig": "Figure 5:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 107, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 93.918, "r_y0": 329.698, "r_x1": 545.114, "r_y1": 329.698, "r_x2": 545.114, "r_y2": 321.146, "r_x3": 93.918, "r_y3": 321.146, "coord_origin": "TOPLEFT"}, "text": "One of the benefits of TableFormer is that it is language agnostic, as an example, the left part of the illustration", "orig": "One of the benefits of TableFormer is that it is language agnostic, as an example, the left part of the illustration", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 108, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 341.653, "r_x1": 545.114, "r_y1": 341.653, "r_x2": 545.114, "r_y2": 333.101, "r_x3": 50.112, "r_y3": 333.101, "coord_origin": "TOPLEFT"}, "text": "demonstrates TableFormer predictions on previously unseen language (Japanese). Additionally, we see that TableFormer is", "orig": "demonstrates TableFormer predictions on previously unseen language (Japanese). Additionally, we see that TableFormer is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 109, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 353.608, "r_x1": 545.114, "r_y1": 353.608, "r_x2": 545.114, "r_y2": 345.056, "r_x3": 50.112, "r_y3": 345.056, "coord_origin": "TOPLEFT"}, "text": "robust to variability in style and content, right side of the illustration shows the example of the TableFormer prediction from", "orig": "robust to variability in style and content, right side of the illustration shows the example of the TableFormer prediction from", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 110, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 365.564, "r_x1": 139.795, "r_y1": 365.564, "r_x2": 139.795, "r_y2": 357.012, "r_x3": 50.112, "r_y3": 357.012, "coord_origin": "TOPLEFT"}, "text": "the FinTabNet dataset.", "orig": "the FinTabNet dataset.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 111, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 220.263, "r_y0": 386.393, "r_x1": 342.078, "r_y1": 386.393, "r_x2": 342.078, "r_y2": 381.96, "r_x3": 220.263, "r_y3": 381.96, "coord_origin": "TOPLEFT"}, "text": "Red - PDF cells, Green - predicted bounding boxes", "orig": "Red - PDF cells, Green - predicted bounding boxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 112, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 53.715, "r_y0": 386.393, "r_x1": 85.657, "r_y1": 386.393, "r_x2": 85.657, "r_y2": 381.96, "r_x3": 53.715, "r_y3": 381.96, "coord_origin": "TOPLEFT"}, "text": "Ground Truth", "orig": "Ground Truth", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 113, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 437.379, "r_y0": 406.686, "r_x1": 443.699, "r_y1": 406.686, "r_x2": 443.699, "r_y2": 401.109, "r_x3": 437.379, "r_y3": 401.109, "coord_origin": "TOPLEFT"}, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 114, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 450.332, "r_y0": 406.686, "r_x1": 456.651, "r_y1": 406.686, "r_x2": 456.651, "r_y2": 401.109, "r_x3": 450.332, "r_y3": 401.109, "coord_origin": "TOPLEFT"}, "text": "17", "orig": "17", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 115, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 463.285, "r_y0": 406.686, "r_x1": 469.604, "r_y1": 406.686, "r_x2": 469.604, "r_y2": 401.109, "r_x3": 463.285, "r_y3": 401.109, "coord_origin": "TOPLEFT"}, "text": "18", "orig": "18", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 116, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 476.237, "r_y0": 406.686, "r_x1": 482.557, "r_y1": 406.686, "r_x2": 482.557, "r_y2": 401.109, "r_x3": 476.237, "r_y3": 401.109, "coord_origin": "TOPLEFT"}, "text": "19", "orig": "19", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 117, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 489.19, "r_y0": 406.686, "r_x1": 495.509, "r_y1": 406.686, "r_x2": 495.509, "r_y2": 401.109, "r_x3": 489.19, "r_y3": 401.109, "coord_origin": "TOPLEFT"}, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 118, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 502.143, "r_y0": 406.686, "r_x1": 508.462, "r_y1": 406.686, "r_x2": 508.462, "r_y2": 401.109, "r_x3": 502.143, "r_y3": 401.109, "coord_origin": "TOPLEFT"}, "text": "21", "orig": "21", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 119, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 515.095, "r_y0": 406.686, "r_x1": 521.414, "r_y1": 406.686, "r_x2": 521.414, "r_y2": 401.109, "r_x3": 515.095, "r_y3": 401.109, "coord_origin": "TOPLEFT"}, "text": "22", "orig": "22", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 120, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 385.281, "r_y0": 417.172, "r_x1": 391.601, "r_y1": 417.172, "r_x2": 391.601, "r_y2": 411.594, "r_x3": 385.281, "r_y3": 411.594, "coord_origin": "TOPLEFT"}, "text": "23", "orig": "23", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 121, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 398.523, "r_y0": 417.172, "r_x1": 404.843, "r_y1": 417.172, "r_x2": 404.843, "r_y2": 411.594, "r_x3": 398.523, "r_y3": 411.594, "coord_origin": "TOPLEFT"}, "text": "24", "orig": "24", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 122, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 411.476, "r_y0": 417.172, "r_x1": 417.795, "r_y1": 417.172, "r_x2": 417.795, "r_y2": 411.594, "r_x3": 411.476, "r_y3": 411.594, "coord_origin": "TOPLEFT"}, "text": "25", "orig": "25", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 123, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 437.379, "r_y0": 417.172, "r_x1": 443.699, "r_y1": 417.172, "r_x2": 443.699, "r_y2": 411.594, "r_x3": 437.379, "r_y3": 411.594, "coord_origin": "TOPLEFT"}, "text": "26", "orig": "26", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 124, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 450.332, "r_y0": 417.172, "r_x1": 456.651, "r_y1": 417.172, "r_x2": 456.651, "r_y2": 411.594, "r_x3": 450.332, "r_y3": 411.594, "coord_origin": "TOPLEFT"}, "text": "27", "orig": "27", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 125, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 463.285, "r_y0": 417.172, "r_x1": 469.604, "r_y1": 417.172, "r_x2": 469.604, "r_y2": 411.594, "r_x3": 463.285, "r_y3": 411.594, "coord_origin": "TOPLEFT"}, "text": "28", "orig": "28", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 126, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 385.281, "r_y0": 427.203, "r_x1": 391.601, "r_y1": 427.203, "r_x2": 391.601, "r_y2": 421.626, "r_x3": 385.281, "r_y3": 421.626, "coord_origin": "TOPLEFT"}, "text": "30", "orig": "30", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 127, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 398.523, "r_y0": 427.203, "r_x1": 404.843, "r_y1": 427.203, "r_x2": 404.843, "r_y2": 421.626, "r_x3": 398.523, "r_y3": 421.626, "coord_origin": "TOPLEFT"}, "text": "31", "orig": "31", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 128, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 411.476, "r_y0": 427.203, "r_x1": 417.795, "r_y1": 427.203, "r_x2": 417.795, "r_y2": 421.626, "r_x3": 411.476, "r_y3": 421.626, "coord_origin": "TOPLEFT"}, "text": "32", "orig": "32", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 129, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 424.429, "r_y0": 427.203, "r_x1": 430.748, "r_y1": 427.203, "r_x2": 430.748, "r_y2": 421.626, "r_x3": 424.429, "r_y3": 421.626, "coord_origin": "TOPLEFT"}, "text": "33", "orig": "33", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 130, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 437.381, "r_y0": 427.203, "r_x1": 443.701, "r_y1": 427.203, "r_x2": 443.701, "r_y2": 421.626, "r_x3": 437.381, "r_y3": 421.626, "coord_origin": "TOPLEFT"}, "text": "34", "orig": "34", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 131, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 450.334, "r_y0": 427.203, "r_x1": 456.653, "r_y1": 427.203, "r_x2": 456.653, "r_y2": 421.626, "r_x3": 450.334, "r_y3": 421.626, "coord_origin": "TOPLEFT"}, "text": "35", "orig": "35", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 132, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 463.287, "r_y0": 427.203, "r_x1": 469.606, "r_y1": 427.203, "r_x2": 469.606, "r_y2": 421.626, "r_x3": 463.287, "r_y3": 421.626, "coord_origin": "TOPLEFT"}, "text": "36", "orig": "36", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 133, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 476.239, "r_y0": 427.203, "r_x1": 482.558, "r_y1": 427.203, "r_x2": 482.558, "r_y2": 421.626, "r_x3": 476.239, "r_y3": 421.626, "coord_origin": "TOPLEFT"}, "text": "37", "orig": "37", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 134, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 489.192, "r_y0": 427.203, "r_x1": 495.511, "r_y1": 427.203, "r_x2": 495.511, "r_y2": 421.626, "r_x3": 489.192, "r_y3": 421.626, "coord_origin": "TOPLEFT"}, "text": "38", "orig": "38", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 135, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 502.144, "r_y0": 427.203, "r_x1": 508.464, "r_y1": 427.203, "r_x2": 508.464, "r_y2": 421.626, "r_x3": 502.144, "r_y3": 421.626, "coord_origin": "TOPLEFT"}, "text": "39", "orig": "39", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 136, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 515.097, "r_y0": 427.203, "r_x1": 521.416, "r_y1": 427.203, "r_x2": 521.416, "r_y2": 421.626, "r_x3": 515.097, "r_y3": 421.626, "coord_origin": "TOPLEFT"}, "text": "40", "orig": "40", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 137, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 528.05, "r_y0": 427.203, "r_x1": 534.369, "r_y1": 427.203, "r_x2": 534.369, "r_y2": 421.626, "r_x3": 528.05, "r_y3": 421.626, "coord_origin": "TOPLEFT"}, "text": "41", "orig": "41", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 138, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 385.281, "r_y0": 438.178, "r_x1": 391.601, "r_y1": 438.178, "r_x2": 391.601, "r_y2": 432.6, "r_x3": 385.281, "r_y3": 432.6, "coord_origin": "TOPLEFT"}, "text": "42", "orig": "42", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 139, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 398.523, "r_y0": 438.178, "r_x1": 404.843, "r_y1": 438.178, "r_x2": 404.843, "r_y2": 432.6, "r_x3": 398.523, "r_y3": 432.6, "coord_origin": "TOPLEFT"}, "text": "43", "orig": "43", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 140, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 411.476, "r_y0": 438.178, "r_x1": 417.795, "r_y1": 438.178, "r_x2": 417.795, "r_y2": 432.6, "r_x3": 411.476, "r_y3": 432.6, "coord_origin": "TOPLEFT"}, "text": "44", "orig": "44", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 141, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 424.429, "r_y0": 438.178, "r_x1": 430.748, "r_y1": 438.178, "r_x2": 430.748, "r_y2": 432.6, "r_x3": 424.429, "r_y3": 432.6, "coord_origin": "TOPLEFT"}, "text": "45", "orig": "45", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 142, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 437.381, "r_y0": 438.178, "r_x1": 443.701, "r_y1": 438.178, "r_x2": 443.701, "r_y2": 432.6, "r_x3": 437.381, "r_y3": 432.6, "coord_origin": "TOPLEFT"}, "text": "46", "orig": "46", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 143, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 450.334, "r_y0": 438.178, "r_x1": 456.653, "r_y1": 438.178, "r_x2": 456.653, "r_y2": 432.6, "r_x3": 450.334, "r_y3": 432.6, "coord_origin": "TOPLEFT"}, "text": "47", "orig": "47", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 144, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 463.287, "r_y0": 438.178, "r_x1": 469.606, "r_y1": 438.178, "r_x2": 469.606, "r_y2": 432.6, "r_x3": 463.287, "r_y3": 432.6, "coord_origin": "TOPLEFT"}, "text": "48", "orig": "48", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 145, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 476.239, "r_y0": 438.178, "r_x1": 482.558, "r_y1": 438.178, "r_x2": 482.558, "r_y2": 432.6, "r_x3": 476.239, "r_y3": 432.6, "coord_origin": "TOPLEFT"}, "text": "49", "orig": "49", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 146, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 489.192, "r_y0": 438.178, "r_x1": 495.511, "r_y1": 438.178, "r_x2": 495.511, "r_y2": 432.6, "r_x3": 489.192, "r_y3": 432.6, "coord_origin": "TOPLEFT"}, "text": "50", "orig": "50", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 147, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 502.144, "r_y0": 438.178, "r_x1": 508.464, "r_y1": 438.178, "r_x2": 508.464, "r_y2": 432.6, "r_x3": 502.144, "r_y3": 432.6, "coord_origin": "TOPLEFT"}, "text": "51", "orig": "51", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 148, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 515.097, "r_y0": 438.178, "r_x1": 521.416, "r_y1": 438.178, "r_x2": 521.416, "r_y2": 432.6, "r_x3": 515.097, "r_y3": 432.6, "coord_origin": "TOPLEFT"}, "text": "52", "orig": "52", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 149, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 528.05, "r_y0": 438.178, "r_x1": 534.369, "r_y1": 438.178, "r_x2": 534.369, "r_y2": 432.6, "r_x3": 528.05, "r_y3": 432.6, "coord_origin": "TOPLEFT"}, "text": "53", "orig": "53", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 150, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 385.281, "r_y0": 395.333, "r_x1": 388.441, "r_y1": 395.333, "r_x2": 388.441, "r_y2": 389.756, "r_x3": 385.281, "r_y3": 389.756, "coord_origin": "TOPLEFT"}, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 151, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 398.523, "r_y0": 395.333, "r_x1": 401.683, "r_y1": 395.333, "r_x2": 401.683, "r_y2": 389.756, "r_x3": 398.523, "r_y3": 389.756, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 152, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 411.475, "r_y0": 395.333, "r_x1": 414.635, "r_y1": 395.333, "r_x2": 414.635, "r_y2": 389.756, "r_x3": 411.475, "r_y3": 389.756, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 153, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 424.427, "r_y0": 395.333, "r_x1": 427.587, "r_y1": 395.333, "r_x2": 427.587, "r_y2": 389.756, "r_x3": 424.427, "r_y3": 389.756, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 154, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 437.379, "r_y0": 395.333, "r_x1": 440.539, "r_y1": 395.333, "r_x2": 440.539, "r_y2": 389.756, "r_x3": 437.379, "r_y3": 389.756, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 155, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 450.331, "r_y0": 395.333, "r_x1": 453.491, "r_y1": 395.333, "r_x2": 453.491, "r_y2": 389.756, "r_x3": 450.331, "r_y3": 389.756, "coord_origin": "TOPLEFT"}, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 156, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 463.283, "r_y0": 395.333, "r_x1": 466.443, "r_y1": 395.333, "r_x2": 466.443, "r_y2": 389.756, "r_x3": 463.283, "r_y3": 389.756, "coord_origin": "TOPLEFT"}, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 157, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 476.235, "r_y0": 395.333, "r_x1": 479.395, "r_y1": 395.333, "r_x2": 479.395, "r_y2": 389.756, "r_x3": 476.235, "r_y3": 389.756, "coord_origin": "TOPLEFT"}, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 158, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 489.187, "r_y0": 395.333, "r_x1": 492.347, "r_y1": 395.333, "r_x2": 492.347, "r_y2": 389.756, "r_x3": 489.187, "r_y3": 389.756, "coord_origin": "TOPLEFT"}, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 159, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 502.139, "r_y0": 395.333, "r_x1": 505.299, "r_y1": 395.333, "r_x2": 505.299, "r_y2": 389.756, "r_x3": 502.139, "r_y3": 389.756, "coord_origin": "TOPLEFT"}, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 160, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 515.091, "r_y0": 395.333, "r_x1": 521.411, "r_y1": 395.333, "r_x2": 521.411, "r_y2": 389.756, "r_x3": 515.091, "r_y3": 389.756, "coord_origin": "TOPLEFT"}, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 161, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 528.044, "r_y0": 395.333, "r_x1": 534.131, "r_y1": 395.333, "r_x2": 534.131, "r_y2": 389.756, "r_x3": 528.044, "r_y3": 389.756, "coord_origin": "TOPLEFT"}, "text": "11", "orig": "11", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 162, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 385.281, "r_y0": 405.108, "r_x1": 391.601, "r_y1": 405.108, "r_x2": 391.601, "r_y2": 399.531, "r_x3": 385.281, "r_y3": 399.531, "coord_origin": "TOPLEFT"}, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 163, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 398.523, "r_y0": 405.108, "r_x1": 404.843, "r_y1": 405.108, "r_x2": 404.843, "r_y2": 399.531, "r_x3": 398.523, "r_y3": 399.531, "coord_origin": "TOPLEFT"}, "text": "13", "orig": "13", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 164, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 411.476, "r_y0": 405.108, "r_x1": 417.795, "r_y1": 405.108, "r_x2": 417.795, "r_y2": 399.531, "r_x3": 411.476, "r_y3": 399.531, "coord_origin": "TOPLEFT"}, "text": "14", "orig": "14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 165, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 424.427, "r_y0": 412.908, "r_x1": 430.746, "r_y1": 412.908, "r_x2": 430.746, "r_y2": 407.331, "r_x3": 424.427, "r_y3": 407.331, "coord_origin": "TOPLEFT"}, "text": "15", "orig": "15", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 166, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 502.869, "r_y0": 417.128, "r_x1": 509.189, "r_y1": 417.128, "r_x2": 509.189, "r_y2": 411.55, "r_x3": 502.869, "r_y3": 411.55, "coord_origin": "TOPLEFT"}, "text": "29", "orig": "29", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 167, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 384.354, "r_y0": 386.393, "r_x1": 430.993, "r_y1": 386.393, "r_x2": 430.993, "r_y2": 381.96, "r_x3": 384.354, "r_y3": 381.96, "coord_origin": "TOPLEFT"}, "text": "Predicted Structure", "orig": "Predicted Structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 168, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.595, "r_y0": 467.549, "r_x1": 98.849, "r_y1": 467.549, "r_x2": 98.849, "r_y2": 458.997, "r_x3": 62.595, "r_y3": 458.997, "coord_origin": "TOPLEFT"}, "text": "Figure 6:", "orig": "Figure 6:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 169, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 104.428, "r_y0": 467.549, "r_x1": 532.63, "r_y1": 467.549, "r_x2": 532.63, "r_y2": 458.997, "r_x3": 104.428, "r_y3": 458.997, "coord_origin": "TOPLEFT"}, "text": "An example of TableFormer predictions (bounding boxes and structure) from generated SynthTabNet table.", "orig": "An example of TableFormer predictions (bounding boxes and structure) from generated SynthTabNet table.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 170, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 501.247, "r_x1": 163.756, "r_y1": 501.247, "r_x2": 163.756, "r_y2": 491.395, "r_x3": 50.112, "r_y3": 491.395, "coord_origin": "TOPLEFT"}, "text": "5.5. Qualitative Analysis", "orig": "5.5. Qualitative Analysis", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 171, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 545.694, "r_x1": 118.505, "r_y1": 545.694, "r_x2": 118.505, "r_y2": 537.142, "r_x3": 62.067, "r_y3": 537.142, "coord_origin": "TOPLEFT"}, "text": "We showcase", "orig": "We showcase", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 172, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 123.985, "r_y0": 545.694, "r_x1": 151.8, "r_y1": 545.694, "r_x2": 151.8, "r_y2": 537.142, "r_x3": 123.985, "r_y3": 537.142, "coord_origin": "TOPLEFT"}, "text": "several", "orig": "several", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 173, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 157.28, "r_y0": 545.694, "r_x1": 212.074, "r_y1": 545.694, "r_x2": 212.074, "r_y2": 537.142, "r_x3": 157.28, "r_y3": 537.142, "coord_origin": "TOPLEFT"}, "text": "visualizations", "orig": "visualizations", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 174, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 217.553, "r_y0": 545.694, "r_x1": 229.17, "r_y1": 545.694, "r_x2": 229.17, "r_y2": 537.142, "r_x3": 217.553, "r_y3": 537.142, "coord_origin": "TOPLEFT"}, "text": "for", "orig": "for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 175, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 234.659, "r_y0": 545.694, "r_x1": 246.833, "r_y1": 545.694, "r_x2": 246.833, "r_y2": 537.142, "r_x3": 234.659, "r_y3": 537.142, "coord_origin": "TOPLEFT"}, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 176, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 252.313, "r_y0": 545.694, "r_x1": 286.365, "r_y1": 545.694, "r_x2": 286.365, "r_y2": 537.142, "r_x3": 252.313, "r_y3": 537.142, "coord_origin": "TOPLEFT"}, "text": "different", "orig": "different", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 177, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 557.649, "r_x1": 211.157, "r_y1": 557.649, "r_x2": 211.157, "r_y2": 549.097, "r_x3": 50.112, "r_y3": 549.097, "coord_origin": "TOPLEFT"}, "text": "components of our network on various", "orig": "components of our network on various", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 178, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 215.1, "r_y0": 557.506, "r_x1": 259.175, "r_y1": 557.506, "r_x2": 259.175, "r_y2": 548.918, "r_x3": 215.1, "r_y3": 548.918, "coord_origin": "TOPLEFT"}, "text": "'complex'", "orig": "'complex'", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 179, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 263.12, "r_y0": 557.649, "r_x1": 286.363, "r_y1": 557.649, "r_x2": 286.363, "r_y2": 549.097, "r_x3": 263.12, "r_y3": 549.097, "coord_origin": "TOPLEFT"}, "text": "tables", "orig": "tables", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 180, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 569.604, "r_x1": 231.72, "r_y1": 569.604, "r_x2": 231.72, "r_y2": 561.052, "r_x3": 50.112, "r_y3": 561.052, "coord_origin": "TOPLEFT"}, "text": "within datasets presented in this work in Fig.", "orig": "within datasets presented in this work in Fig.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 181, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 236.064, "r_y0": 569.604, "r_x1": 277.03, "r_y1": 569.604, "r_x2": 277.03, "r_y2": 561.052, "r_x3": 236.064, "r_y3": 561.052, "coord_origin": "TOPLEFT"}, "text": "5 and Fig.", "orig": "5 and Fig.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 182, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 281.384, "r_y0": 569.604, "r_x1": 286.365, "r_y1": 569.604, "r_x2": 286.365, "r_y2": 561.052, "r_x3": 281.384, "r_y3": 561.052, "coord_origin": "TOPLEFT"}, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 183, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 581.559, "r_x1": 286.365, "r_y1": 581.559, "r_x2": 286.365, "r_y2": 573.0070000000001, "r_x3": 50.112, "r_y3": 573.0070000000001, "coord_origin": "TOPLEFT"}, "text": "As it is shown, our model is able to predict bounding boxes", "orig": "As it is shown, our model is able to predict bounding boxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 184, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 593.514, "r_x1": 122.341, "r_y1": 593.514, "r_x2": 122.341, "r_y2": 584.962, "r_x3": 50.112, "r_y3": 584.962, "coord_origin": "TOPLEFT"}, "text": "for all table cells,", "orig": "for all table cells,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 185, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 126.107, "r_y0": 593.514, "r_x1": 228.004, "r_y1": 593.514, "r_x2": 228.004, "r_y2": 584.962, "r_x3": 126.107, "r_y3": 584.962, "coord_origin": "TOPLEFT"}, "text": "even for the empty ones.", "orig": "even for the empty ones.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 186, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 234.151, "r_y0": 593.514, "r_x1": 286.365, "r_y1": 593.514, "r_x2": 286.365, "r_y2": 584.962, "r_x3": 234.151, "r_y3": 584.962, "coord_origin": "TOPLEFT"}, "text": "Additionally,", "orig": "Additionally,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 187, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 605.47, "r_x1": 286.365, "r_y1": 605.47, "r_x2": 286.365, "r_y2": 596.918, "r_x3": 50.112, "r_y3": 596.918, "coord_origin": "TOPLEFT"}, "text": "our post-processing techniques can extract the cell content", "orig": "our post-processing techniques can extract the cell content", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 188, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 617.425, "r_x1": 286.365, "r_y1": 617.425, "r_x2": 286.365, "r_y2": 608.873, "r_x3": 50.112, "r_y3": 608.873, "coord_origin": "TOPLEFT"}, "text": "by matching the predicted bounding boxes to the PDF cells", "orig": "by matching the predicted bounding boxes to the PDF cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 189, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 629.38, "r_x1": 230.873, "r_y1": 629.38, "r_x2": 230.873, "r_y2": 620.828, "r_x3": 50.112, "r_y3": 620.828, "coord_origin": "TOPLEFT"}, "text": "based on their overlap and spatial proximity.", "orig": "based on their overlap and spatial proximity.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 190, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 235.855, "r_y0": 629.38, "r_x1": 286.365, "r_y1": 629.38, "r_x2": 286.365, "r_y2": 620.828, "r_x3": 235.855, "r_y3": 620.828, "coord_origin": "TOPLEFT"}, "text": "The left part", "orig": "The left part", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 191, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 641.335, "r_x1": 77.121, "r_y1": 641.335, "r_x2": 77.121, "r_y2": 632.783, "r_x3": 50.112, "r_y3": 632.783, "coord_origin": "TOPLEFT"}, "text": "of Fig.", "orig": "of Fig.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 192, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 81.544, "r_y0": 641.335, "r_x1": 286.365, "r_y1": 641.335, "r_x2": 286.365, "r_y2": 632.783, "r_x3": 81.544, "r_y3": 632.783, "coord_origin": "TOPLEFT"}, "text": "5 demonstrates also the adaptability of our method", "orig": "5 demonstrates also the adaptability of our method", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 193, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 653.29, "r_x1": 57.863, "r_y1": 653.29, "r_x2": 57.863, "r_y2": 644.738, "r_x3": 50.112, "r_y3": 644.738, "coord_origin": "TOPLEFT"}, "text": "to", "orig": "to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 194, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.436, "r_y0": 653.29, "r_x1": 119.691, "r_y1": 653.29, "r_x2": 119.691, "r_y2": 644.738, "r_x3": 62.436, "r_y3": 644.738, "coord_origin": "TOPLEFT"}, "text": "any language,", "orig": "any language,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 195, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 124.782, "r_y0": 653.29, "r_x1": 133.081, "r_y1": 653.29, "r_x2": 133.081, "r_y2": 644.738, "r_x3": 124.782, "r_y3": 644.738, "coord_origin": "TOPLEFT"}, "text": "as", "orig": "as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 196, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 137.653, "r_y0": 653.29, "r_x1": 143.193, "r_y1": 653.29, "r_x2": 143.193, "r_y2": 644.738, "r_x3": 137.653, "r_y3": 644.738, "coord_origin": "TOPLEFT"}, "text": "it", "orig": "it", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 197, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 147.765, "r_y0": 653.29, "r_x1": 214.854, "r_y1": 653.29, "r_x2": 214.854, "r_y2": 644.738, "r_x3": 147.765, "r_y3": 644.738, "coord_origin": "TOPLEFT"}, "text": "can successfully", "orig": "can successfully", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 198, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 219.426, "r_y0": 653.29, "r_x1": 246.385, "r_y1": 653.29, "r_x2": 246.385, "r_y2": 644.738, "r_x3": 219.426, "r_y3": 644.738, "coord_origin": "TOPLEFT"}, "text": "extract", "orig": "extract", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 199, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 250.958, "r_y0": 653.29, "r_x1": 286.365, "r_y1": 653.29, "r_x2": 286.365, "r_y2": 644.738, "r_x3": 250.958, "r_y3": 644.738, "coord_origin": "TOPLEFT"}, "text": "Japanese", "orig": "Japanese", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 200, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 665.245, "r_x1": 286.365, "r_y1": 665.245, "r_x2": 286.365, "r_y2": 656.693, "r_x3": 50.112, "r_y3": 656.693, "coord_origin": "TOPLEFT"}, "text": "text, although the training set contains only English content.", "orig": "text, although the training set contains only English content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 201, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 677.201, "r_x1": 286.365, "r_y1": 677.201, "r_x2": 286.365, "r_y2": 668.649, "r_x3": 50.112, "r_y3": 668.649, "coord_origin": "TOPLEFT"}, "text": "We provide more visualizations including the intermediate", "orig": "We provide more visualizations including the intermediate", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 202, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 689.156, "r_x1": 195.217, "r_y1": 689.156, "r_x2": 195.217, "r_y2": 680.604, "r_x3": 50.112, "r_y3": 680.604, "coord_origin": "TOPLEFT"}, "text": "steps in the supplementary material.", "orig": "steps in the supplementary material.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 203, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 199.431, "r_y0": 689.156, "r_x1": 286.365, "r_y1": 689.156, "r_x2": 286.365, "r_y2": 680.604, "r_x3": 199.431, "r_y3": 680.604, "coord_origin": "TOPLEFT"}, "text": "Overall these illustra-", "orig": "Overall these illustra-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 204, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 701.111, "r_x1": 286.365, "r_y1": 701.111, "r_x2": 286.365, "r_y2": 692.559, "r_x3": 50.112, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "tions justify the versatility of our method across a diverse", "orig": "tions justify the versatility of our method across a diverse", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 205, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 713.066, "r_x1": 226.888, "r_y1": 713.066, "r_x2": 226.888, "r_y2": 704.514, "r_x3": 50.112, "r_y3": 704.514, "coord_origin": "TOPLEFT"}, "text": "range of table appearances and content type.", "orig": "range of table appearances and content type.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 206, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 501.457, "r_x1": 460.848, "r_y1": 501.457, "r_x2": 460.848, "r_y2": 490.709, "r_x3": 308.862, "r_y3": 490.709, "coord_origin": "TOPLEFT"}, "text": "6. Future Work &Conclusion", "orig": "6. Future Work &Conclusion", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 207, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 521.7139999999999, "r_x1": 545.115, "r_y1": 521.7139999999999, "r_x2": 545.115, "r_y2": 513.162, "r_x3": 320.817, "r_y3": 513.162, "coord_origin": "TOPLEFT"}, "text": "In this paper, we presented TableFormer an end-to-end", "orig": "In this paper, we presented TableFormer an end-to-end", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 208, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 533.669, "r_x1": 545.115, "r_y1": 533.669, "r_x2": 545.115, "r_y2": 525.117, "r_x3": 308.862, "r_y3": 525.117, "coord_origin": "TOPLEFT"}, "text": "transformer based approach to predict table structures and", "orig": "transformer based approach to predict table structures and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 209, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 545.624, "r_x1": 545.115, "r_y1": 545.624, "r_x2": 545.115, "r_y2": 537.072, "r_x3": 308.862, "r_y3": 537.072, "coord_origin": "TOPLEFT"}, "text": "bounding boxes of cells from an image. This approach en-", "orig": "bounding boxes of cells from an image. This approach en-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 210, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 557.579, "r_x1": 545.115, "r_y1": 557.579, "r_x2": 545.115, "r_y2": 549.027, "r_x3": 308.862, "r_y3": 549.027, "coord_origin": "TOPLEFT"}, "text": "ables us to recreate the table structure, and extract the cell", "orig": "ables us to recreate the table structure, and extract the cell", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 211, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 569.534, "r_x1": 524.562, "r_y1": 569.534, "r_x2": 524.562, "r_y2": 560.982, "r_x3": 308.862, "r_y3": 560.982, "coord_origin": "TOPLEFT"}, "text": "content from PDF or OCR by using bounding boxes.", "orig": "content from PDF or OCR by using bounding boxes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 212, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 529.623, "r_y0": 569.534, "r_x1": 545.115, "r_y1": 569.534, "r_x2": 545.115, "r_y2": 560.982, "r_x3": 529.623, "r_y3": 560.982, "coord_origin": "TOPLEFT"}, "text": "Ad-", "orig": "Ad-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 213, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 581.489, "r_x1": 545.115, "r_y1": 581.489, "r_x2": 545.115, "r_y2": 572.937, "r_x3": 308.862, "r_y3": 572.937, "coord_origin": "TOPLEFT"}, "text": "ditionally, it provides the versatility required in real-world", "orig": "ditionally, it provides the versatility required in real-world", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 214, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 593.4449999999999, "r_x1": 545.115, "r_y1": 593.4449999999999, "r_x2": 545.115, "r_y2": 584.893, "r_x3": 308.862, "r_y3": 584.893, "coord_origin": "TOPLEFT"}, "text": "scenarios when dealing with various types of PDF docu-", "orig": "scenarios when dealing with various types of PDF docu-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 215, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 605.4, "r_x1": 335.153, "r_y1": 605.4, "r_x2": 335.153, "r_y2": 596.848, "r_x3": 308.862, "r_y3": 596.848, "coord_origin": "TOPLEFT"}, "text": "ments,", "orig": "ments,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 216, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 339.656, "r_y0": 605.4, "r_x1": 400.468, "r_y1": 605.4, "r_x2": 400.468, "r_y2": 596.848, "r_x3": 339.656, "r_y3": 596.848, "coord_origin": "TOPLEFT"}, "text": "and languages.", "orig": "and languages.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 217, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 408.378, "r_y0": 605.4, "r_x1": 460.672, "r_y1": 605.4, "r_x2": 460.672, "r_y2": 596.848, "r_x3": 408.378, "r_y3": 596.848, "coord_origin": "TOPLEFT"}, "text": "Furthermore,", "orig": "Furthermore,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 218, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 465.175, "r_y0": 605.4, "r_x1": 545.115, "r_y1": 605.4, "r_x2": 545.115, "r_y2": 596.848, "r_x3": 465.175, "r_y3": 596.848, "coord_origin": "TOPLEFT"}, "text": "our method outper-", "orig": "our method outper-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 219, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 617.355, "r_x1": 495.471, "r_y1": 617.355, "r_x2": 495.471, "r_y2": 608.803, "r_x3": 308.862, "r_y3": 608.803, "coord_origin": "TOPLEFT"}, "text": "forms all state-of-the-arts with a wide margin.", "orig": "forms all state-of-the-arts with a wide margin.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 220, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 500.234, "r_y0": 617.355, "r_x1": 545.115, "r_y1": 617.355, "r_x2": 545.115, "r_y2": 608.803, "r_x3": 500.234, "r_y3": 608.803, "coord_origin": "TOPLEFT"}, "text": "Finally, we", "orig": "Finally, we", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 221, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 629.31, "r_x1": 545.115, "r_y1": 629.31, "r_x2": 545.115, "r_y2": 620.758, "r_x3": 308.862, "r_y3": 620.758, "coord_origin": "TOPLEFT"}, "text": "introduce 'SynthTabNet' a challenging synthetically gen-", "orig": "introduce 'SynthTabNet' a challenging synthetically gen-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 222, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 641.265, "r_x1": 545.115, "r_y1": 641.265, "r_x2": 545.115, "r_y2": 632.713, "r_x3": 308.862, "r_y3": 632.713, "coord_origin": "TOPLEFT"}, "text": "erated dataset that reinforces missing characteristics from", "orig": "erated dataset that reinforces missing characteristics from", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 223, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 653.22, "r_x1": 365.858, "r_y1": 653.22, "r_x2": 365.858, "r_y2": 644.668, "r_x3": 308.862, "r_y3": 644.668, "coord_origin": "TOPLEFT"}, "text": "other datasets.", "orig": "other datasets.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 224, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 682.847, "r_x1": 364.406, "r_y1": 682.847, "r_x2": 364.406, "r_y2": 672.099, "r_x3": 308.862, "r_y3": 672.099, "coord_origin": "TOPLEFT"}, "text": "References", "orig": "References", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 225, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 313.345, "r_y0": 701.901, "r_x1": 323.8, "r_y1": 701.901, "r_x2": 323.8, "r_y2": 694.204, "r_x3": 313.345, "r_y3": 694.204, "coord_origin": "TOPLEFT"}, "text": "[1]", "orig": "[1]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 226, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.785, "r_y0": 701.901, "r_x1": 545.109, "r_y1": 701.901, "r_x2": 545.109, "r_y2": 694.204, "r_x3": 328.785, "r_y3": 694.204, "coord_origin": "TOPLEFT"}, "text": "Nicolas Carion, Francisco Massa, Gabriel Synnaeve, Nicolas", "orig": "Nicolas Carion, Francisco Massa, Gabriel Synnaeve, Nicolas", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 227, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 712.86, "r_x1": 545.113, "r_y1": 712.86, "r_x2": 545.113, "r_y2": 705.163, "r_x3": 328.781, "r_y3": 705.163, "coord_origin": "TOPLEFT"}, "text": "Usunier, Alexander Kirillov, and Sergey Zagoruyko. End-to-", "orig": "Usunier, Alexander Kirillov, and Sergey Zagoruyko. End-to-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 228, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 295.121, "r_y0": 742.954, "r_x1": 300.102, "r_y1": 742.954, "r_x2": 300.102, "r_y2": 734.402, "r_x3": 295.121, "r_y3": 734.402, "coord_origin": "TOPLEFT"}, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "parsed_page": null, "predictions": {"layout": {"clusters": [{"id": 18, "label": "caption", "bbox": {"l": 53.812, "t": 208.54100000000005, "r": 385.934, "b": 216.02300000000002, "coord_origin": "TOPLEFT"}, "confidence": 0.5986505746841431, "cells": [{"index": 0, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 53.812, "r_y0": 216.02300000000002, "r_x1": 385.934, "r_y1": 216.02300000000002, "r_x2": 385.934, "r_y2": 208.54100000000005, "r_x3": 53.812, "r_y3": 208.54100000000005, "coord_origin": "TOPLEFT"}, "text": "b. Structure predicted by TableFormer, with superimposed matched PDF cell text:", "orig": "b. Structure predicted by TableFormer, with superimposed matched PDF cell text:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 29, "label": "section_header", "bbox": {"l": 53.812, "t": 94.58900000000006, "r": 284.346, "b": 102.07100000000003, "coord_origin": "TOPLEFT"}, "confidence": 0.46452972292900085, "cells": [{"index": 1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 53.812, "r_y0": 102.07100000000003, "r_x1": 284.346, "r_y1": 102.07100000000003, "r_x2": 284.346, "r_y2": 94.58900000000006, "r_x3": 53.812, "r_y3": 94.58900000000006, "coord_origin": "TOPLEFT"}, "text": "Japanese language (previously unseen by TableFormer):", "orig": "Japanese language (previously unseen by TableFormer):", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 31, "label": "section_header", "bbox": {"l": 304.831, "t": 94.58900000000006, "r": 431.091, "b": 102.07100000000003, "coord_origin": "TOPLEFT"}, "confidence": 0.4629225730895996, "cells": [{"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 304.831, "r_y0": 102.07100000000003, "r_x1": 431.091, "r_y1": 102.07100000000003, "r_x2": 431.091, "r_y2": 94.58900000000006, "r_x3": 304.831, "r_y3": 94.58900000000006, "coord_origin": "TOPLEFT"}, "text": "Example table from FinTabNet:", "orig": "Example table from FinTabNet:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 21, "label": "list_item", "bbox": {"l": 53.286, "t": 78.995, "r": 499.556, "b": 86.47699999999998, "coord_origin": "TOPLEFT"}, "confidence": 0.541211724281311, "cells": [{"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 53.286, "r_y0": 86.47699999999998, "r_x1": 499.556, "r_y1": 86.47699999999998, "r_x2": 499.556, "r_y2": 78.995, "r_x3": 53.286, "r_y3": 78.995, "coord_origin": "TOPLEFT"}, "text": "a. Red - PDF cells, Green - predicted bounding boxes, Blue - post-processed predictions matched to PDF cells", "orig": "a. Red - PDF cells, Green - predicted bounding boxes, Blue - post-processed predictions matched to PDF cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 8, "label": "table", "bbox": {"l": 53.62853240966797, "t": 218.94857788085938, "r": 298.5574951171875, "b": 292.39996337890625, "coord_origin": "TOPLEFT"}, "confidence": 0.8824009299278259, "cells": [{"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 209.933, "r_y0": 226.00400000000002, "r_x1": 223.873, "r_y1": 226.00400000000002, "r_x2": 223.873, "r_y2": 221.35799999999995, "r_x3": 209.933, "r_y3": 221.35799999999995, "coord_origin": "TOPLEFT"}, "text": "\u8ad6\u6587\u30d5\u30a1\u30a4\u30eb", "orig": "\u8ad6\u6587\u30d5\u30a1\u30a4\u30eb", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 263.765, "r_y0": 226.00400000000002, "r_x1": 273.058, "r_y1": 226.00400000000002, "r_x2": 273.058, "r_y2": 221.35799999999995, "r_x3": 263.765, "r_y3": 221.35799999999995, "coord_origin": "TOPLEFT"}, "text": "\u53c2\u8003\u6587\u732e", "orig": "\u53c2\u8003\u6587\u732e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 110.25, "r_y0": 233.49, "r_x1": 114.896, "r_y1": 233.49, "r_x2": 114.896, "r_y2": 228.84400000000005, "r_x3": 110.25, "r_y3": 228.84400000000005, "coord_origin": "TOPLEFT"}, "text": "\u51fa\u5178", "orig": "\u51fa\u5178", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 175.366, "r_y0": 233.49, "r_x1": 186.983, "r_y1": 233.49, "r_x2": 186.983, "r_y2": 228.84400000000005, "r_x3": 175.366, "r_y3": 228.84400000000005, "coord_origin": "TOPLEFT"}, "text": "\u30d5\u30a1\u30a4\u30eb\u6570", "orig": "\u30d5\u30a1\u30a4\u30eb\u6570", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 195.314, "r_y0": 233.49, "r_x1": 199.961, "r_y1": 233.49, "r_x2": 199.961, "r_y2": 228.84400000000005, "r_x3": 195.314, "r_y3": 228.84400000000005, "coord_origin": "TOPLEFT"}, "text": "\u82f1\u8a9e", "orig": "\u82f1\u8a9e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 229.198, "r_y0": 233.49, "r_x1": 236.168, "r_y1": 233.49, "r_x2": 236.168, "r_y2": 228.84400000000005, "r_x3": 229.198, "r_y3": 228.84400000000005, "coord_origin": "TOPLEFT"}, "text": "\u65e5\u672c\u8a9e", "orig": "\u65e5\u672c\u8a9e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 256.114, "r_y0": 233.49, "r_x1": 260.761, "r_y1": 233.49, "r_x2": 260.761, "r_y2": 228.84400000000005, "r_x3": 256.114, "r_y3": 228.84400000000005, "coord_origin": "TOPLEFT"}, "text": "\u82f1\u8a9e", "orig": "\u82f1\u8a9e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 278.384, "r_y0": 233.49, "r_x1": 285.354, "r_y1": 233.49, "r_x2": 285.354, "r_y2": 228.84400000000005, "r_x3": 278.384, "r_y3": 228.84400000000005, "coord_origin": "TOPLEFT"}, "text": "\u65e5\u672c\u8a9e", "orig": "\u65e5\u672c\u8a9e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 55.531, "r_y0": 240.76800000000003, "r_x1": 162.713, "r_y1": 240.76800000000003, "r_x2": 162.713, "r_y2": 236.48199999999997, "r_x3": 55.531, "r_y3": 236.48199999999997, "coord_origin": "TOPLEFT"}, "text": "Association for Computational Linguistics(ACL2003)", "orig": "Association for Computational Linguistics(ACL2003)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 184.397, "r_y0": 240.76800000000003, "r_x1": 189.565, "r_y1": 240.76800000000003, "r_x2": 189.565, "r_y2": 236.48199999999997, "r_x3": 184.397, "r_y3": 236.48199999999997, "coord_origin": "TOPLEFT"}, "text": "65", "orig": "65", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 208.99, "r_y0": 240.76800000000003, "r_x1": 214.158, "r_y1": 240.76800000000003, "r_x2": 214.158, "r_y2": 236.48199999999997, "r_x3": 208.99, "r_y3": 236.48199999999997, "coord_origin": "TOPLEFT"}, "text": "65", "orig": "65", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 234.875, "r_y0": 240.76800000000003, "r_x1": 237.458, "r_y1": 240.76800000000003, "r_x2": 237.458, "r_y2": 236.48199999999997, "r_x3": 234.875, "r_y3": 236.48199999999997, "coord_origin": "TOPLEFT"}, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 256.884, "r_y0": 240.76800000000003, "r_x1": 264.636, "r_y1": 240.76800000000003, "r_x2": 264.636, "r_y2": 236.48199999999997, "r_x3": 256.884, "r_y3": 236.48199999999997, "coord_origin": "TOPLEFT"}, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 284.061, "r_y0": 240.76800000000003, "r_x1": 286.644, "r_y1": 240.76800000000003, "r_x2": 286.644, "r_y2": 236.48199999999997, "r_x3": 284.061, "r_y3": 236.48199999999997, "coord_origin": "TOPLEFT"}, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 55.531, "r_y0": 246.962, "r_x1": 139.722, "r_y1": 246.962, "r_x2": 139.722, "r_y2": 242.67600000000004, "r_x3": 55.531, "r_y3": 242.67600000000004, "coord_origin": "TOPLEFT"}, "text": "Computational Linguistics(COLING2002)", "orig": "Computational Linguistics(COLING2002)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 19, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.105, "r_y0": 246.962, "r_x1": 190.857, "r_y1": 246.962, "r_x2": 190.857, "r_y2": 242.67600000000004, "r_x3": 183.105, "r_y3": 242.67600000000004, "coord_origin": "TOPLEFT"}, "text": "140", "orig": "140", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 20, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 207.698, "r_y0": 246.962, "r_x1": 215.45, "r_y1": 246.962, "r_x2": 215.45, "r_y2": 242.67600000000004, "r_x3": 207.698, "r_y3": 242.67600000000004, "coord_origin": "TOPLEFT"}, "text": "140", "orig": "140", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 21, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 234.875, "r_y0": 246.962, "r_x1": 237.458, "r_y1": 246.962, "r_x2": 237.458, "r_y2": 242.67600000000004, "r_x3": 234.875, "r_y3": 242.67600000000004, "coord_origin": "TOPLEFT"}, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 22, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 256.884, "r_y0": 246.962, "r_x1": 264.636, "r_y1": 246.962, "r_x2": 264.636, "r_y2": 242.67600000000004, "r_x3": 256.884, "r_y3": 242.67600000000004, "coord_origin": "TOPLEFT"}, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 23, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 284.061, "r_y0": 246.962, "r_x1": 286.644, "r_y1": 246.962, "r_x2": 286.644, "r_y2": 242.67600000000004, "r_x3": 284.061, "r_y3": 242.67600000000004, "coord_origin": "TOPLEFT"}, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 24, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 55.531, "r_y0": 253.62199999999996, "r_x1": 74.118, "r_y1": 253.62199999999996, "r_x2": 74.118, "r_y2": 248.976, "r_x3": 55.531, "r_y3": 248.976, "coord_origin": "TOPLEFT"}, "text": "\u96fb\u6c17\u60c5\u5831\u901a\u4fe1\u5b66\u4f1a", "orig": "\u96fb\u6c17\u60c5\u5831\u901a\u4fe1\u5b66\u4f1a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 25, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 92.698, "r_y0": 253.93100000000004, "r_x1": 103.034, "r_y1": 253.93100000000004, "r_x2": 103.034, "r_y2": 249.64499999999998, "r_x3": 92.698, "r_y3": 249.64499999999998, "coord_origin": "TOPLEFT"}, "text": "2003", "orig": "2003", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 26, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 103.034, "r_y0": 253.62199999999996, "r_x1": 114.651, "r_y1": 253.62199999999996, "r_x2": 114.651, "r_y2": 248.976, "r_x3": 103.034, "r_y3": 248.976, "coord_origin": "TOPLEFT"}, "text": "\u5e74\u7dcf\u5408\u5927\u4f1a", "orig": "\u5e74\u7dcf\u5408\u5927\u4f1a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 27, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.105, "r_y0": 253.15700000000004, "r_x1": 190.857, "r_y1": 253.15700000000004, "r_x2": 190.857, "r_y2": 248.87099999999998, "r_x3": 183.105, "r_y3": 248.87099999999998, "coord_origin": "TOPLEFT"}, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 28, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 210.282, "r_y0": 253.15700000000004, "r_x1": 212.865, "r_y1": 253.15700000000004, "r_x2": 212.865, "r_y2": 248.87099999999998, "r_x3": 210.282, "r_y3": 248.87099999999998, "coord_origin": "TOPLEFT"}, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 29, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 232.292, "r_y0": 253.15700000000004, "r_x1": 240.043, "r_y1": 253.15700000000004, "r_x2": 240.043, "r_y2": 248.87099999999998, "r_x3": 232.292, "r_y3": 248.87099999999998, "coord_origin": "TOPLEFT"}, "text": "142", "orig": "142", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 30, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 256.884, "r_y0": 253.15700000000004, "r_x1": 264.636, "r_y1": 253.15700000000004, "r_x2": 264.636, "r_y2": 248.87099999999998, "r_x3": 256.884, "r_y3": 248.87099999999998, "coord_origin": "TOPLEFT"}, "text": "223", "orig": "223", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 281.477, "r_y0": 253.15700000000004, "r_x1": 289.229, "r_y1": 253.15700000000004, "r_x2": 289.229, "r_y2": 248.87099999999998, "r_x3": 281.477, "r_y3": 248.87099999999998, "coord_origin": "TOPLEFT"}, "text": "147", "orig": "147", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 55.531, "r_y0": 261.10699999999997, "r_x1": 71.794, "r_y1": 261.10699999999997, "r_x2": 71.794, "r_y2": 256.461, "r_x3": 55.531, "r_y3": 256.461, "coord_origin": "TOPLEFT"}, "text": "\u60c5\u5831\u51e6\u7406\u5b66\u4f1a\u7b2c", "orig": "\u60c5\u5831\u51e6\u7406\u5b66\u4f1a\u7b2c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 88.053, "r_y0": 261.41600000000005, "r_x1": 93.22, "r_y1": 261.41600000000005, "r_x2": 93.22, "r_y2": 257.13, "r_x3": 88.053, "r_y3": 257.13, "coord_origin": "TOPLEFT"}, "text": "65", "orig": "65", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 93.22, "r_y0": 261.10699999999997, "r_x1": 104.837, "r_y1": 261.10699999999997, "r_x2": 104.837, "r_y2": 256.461, "r_x3": 93.22, "r_y3": 256.461, "coord_origin": "TOPLEFT"}, "text": "\u56de\u5168\u56fd\u5927\u4f1a", "orig": "\u56de\u5168\u56fd\u5927\u4f1a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 116.451, "r_y0": 261.41600000000005, "r_x1": 129.882, "r_y1": 261.41600000000005, "r_x2": 129.882, "r_y2": 257.13, "r_x3": 116.451, "r_y3": 257.13, "coord_origin": "TOPLEFT"}, "text": "(2003)", "orig": "(2003)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.105, "r_y0": 260.64200000000005, "r_x1": 190.857, "r_y1": 260.64200000000005, "r_x2": 190.857, "r_y2": 256.356, "r_x3": 183.105, "r_y3": 256.356, "coord_origin": "TOPLEFT"}, "text": "177", "orig": "177", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 210.282, "r_y0": 260.64200000000005, "r_x1": 212.865, "r_y1": 260.64200000000005, "r_x2": 212.865, "r_y2": 256.356, "r_x3": 210.282, "r_y3": 256.356, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 232.292, "r_y0": 260.64200000000005, "r_x1": 240.043, "r_y1": 260.64200000000005, "r_x2": 240.043, "r_y2": 256.356, "r_x3": 232.292, "r_y3": 256.356, "coord_origin": "TOPLEFT"}, "text": "176", "orig": "176", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 256.884, "r_y0": 260.64200000000005, "r_x1": 264.636, "r_y1": 260.64200000000005, "r_x2": 264.636, "r_y2": 256.356, "r_x3": 256.884, "r_y3": 256.356, "coord_origin": "TOPLEFT"}, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 281.477, "r_y0": 260.64200000000005, "r_x1": 289.229, "r_y1": 260.64200000000005, "r_x2": 289.229, "r_y2": 256.356, "r_x3": 281.477, "r_y3": 256.356, "coord_origin": "TOPLEFT"}, "text": "236", "orig": "236", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 55.531, "r_y0": 268.33399999999995, "r_x1": 57.854, "r_y1": 268.33399999999995, "r_x2": 57.854, "r_y2": 263.688, "r_x3": 55.531, "r_y3": 263.688, "coord_origin": "TOPLEFT"}, "text": "\u7b2c", "orig": "\u7b2c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 60.177, "r_y0": 268.644, "r_x1": 65.344, "r_y1": 268.644, "r_x2": 65.344, "r_y2": 264.35699999999997, "r_x3": 60.177, "r_y3": 264.35699999999997, "coord_origin": "TOPLEFT"}, "text": "17", "orig": "17", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 65.344, "r_y0": 268.33399999999995, "r_x1": 90.902, "r_y1": 268.33399999999995, "r_x2": 90.902, "r_y2": 263.688, "r_x3": 65.344, "r_y3": 263.688, "coord_origin": "TOPLEFT"}, "text": "\u56de\u4eba\u5de5\u77e5\u80fd\u5b66\u4f1a\u5168\u56fd\u5927\u4f1a", "orig": "\u56de\u4eba\u5de5\u77e5\u80fd\u5b66\u4f1a\u5168\u56fd\u5927\u4f1a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 116.451, "r_y0": 268.644, "r_x1": 129.882, "r_y1": 268.644, "r_x2": 129.882, "r_y2": 264.35699999999997, "r_x3": 116.451, "r_y3": 264.35699999999997, "coord_origin": "TOPLEFT"}, "text": "(2003)", "orig": "(2003)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.105, "r_y0": 267.869, "r_x1": 190.857, "r_y1": 267.869, "r_x2": 190.857, "r_y2": 263.58299999999997, "r_x3": 183.105, "r_y3": 263.58299999999997, "coord_origin": "TOPLEFT"}, "text": "208", "orig": "208", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 210.282, "r_y0": 267.869, "r_x1": 212.865, "r_y1": 267.869, "r_x2": 212.865, "r_y2": 263.58299999999997, "r_x3": 210.282, "r_y3": 263.58299999999997, "coord_origin": "TOPLEFT"}, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 232.292, "r_y0": 267.869, "r_x1": 240.043, "r_y1": 267.869, "r_x2": 240.043, "r_y2": 263.58299999999997, "r_x3": 232.292, "r_y3": 263.58299999999997, "coord_origin": "TOPLEFT"}, "text": "203", "orig": "203", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 48, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 256.884, "r_y0": 267.869, "r_x1": 264.636, "r_y1": 267.869, "r_x2": 264.636, "r_y2": 263.58299999999997, "r_x3": 256.884, "r_y3": 263.58299999999997, "coord_origin": "TOPLEFT"}, "text": "152", "orig": "152", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 49, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 281.477, "r_y0": 267.869, "r_x1": 289.229, "r_y1": 267.869, "r_x2": 289.229, "r_y2": 263.58299999999997, "r_x3": 281.477, "r_y3": 263.58299999999997, "coord_origin": "TOPLEFT"}, "text": "244", "orig": "244", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 50, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 55.531, "r_y0": 275.562, "r_x1": 78.765, "r_y1": 275.562, "r_x2": 78.765, "r_y2": 270.91600000000005, "r_x3": 55.531, "r_y3": 270.91600000000005, "coord_origin": "TOPLEFT"}, "text": "\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u7814\u7a76\u4f1a\u7b2c", "orig": "\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u7814\u7a76\u4f1a\u7b2c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 51, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 101.99, "r_y0": 275.871, "r_x1": 109.742, "r_y1": 275.871, "r_x2": 109.742, "r_y2": 271.58500000000004, "r_x3": 101.99, "r_y3": 271.58500000000004, "coord_origin": "TOPLEFT"}, "text": "146", "orig": "146", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 52, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 109.742, "r_y0": 275.562, "r_x1": 112.065, "r_y1": 275.562, "r_x2": 112.065, "r_y2": 270.91600000000005, "r_x3": 109.742, "r_y3": 270.91600000000005, "coord_origin": "TOPLEFT"}, "text": "\u301c", "orig": "\u301c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 53, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 114.388, "r_y0": 275.871, "r_x1": 122.139, "r_y1": 275.871, "r_x2": 122.139, "r_y2": 271.58500000000004, "r_x3": 114.388, "r_y3": 271.58500000000004, "coord_origin": "TOPLEFT"}, "text": "155", "orig": "155", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 54, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 122.14, "r_y0": 275.562, "r_x1": 124.463, "r_y1": 275.562, "r_x2": 124.463, "r_y2": 270.91600000000005, "r_x3": 122.14, "r_y3": 270.91600000000005, "coord_origin": "TOPLEFT"}, "text": "\u56de", "orig": "\u56de", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 55, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 184.397, "r_y0": 275.096, "r_x1": 189.565, "r_y1": 275.096, "r_x2": 189.565, "r_y2": 270.80999999999995, "r_x3": 184.397, "r_y3": 270.80999999999995, "coord_origin": "TOPLEFT"}, "text": "98", "orig": "98", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 56, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 210.282, "r_y0": 275.096, "r_x1": 212.865, "r_y1": 275.096, "r_x2": 212.865, "r_y2": 270.80999999999995, "r_x3": 210.282, "r_y3": 270.80999999999995, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 57, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 233.583, "r_y0": 275.096, "r_x1": 238.751, "r_y1": 275.096, "r_x2": 238.751, "r_y2": 270.80999999999995, "r_x3": 233.583, "r_y3": 270.80999999999995, "coord_origin": "TOPLEFT"}, "text": "96", "orig": "96", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 58, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 256.884, "r_y0": 275.096, "r_x1": 264.636, "r_y1": 275.096, "r_x2": 264.636, "r_y2": 270.80999999999995, "r_x3": 256.884, "r_y3": 270.80999999999995, "coord_origin": "TOPLEFT"}, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 59, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 281.477, "r_y0": 275.096, "r_x1": 289.229, "r_y1": 275.096, "r_x2": 289.229, "r_y2": 270.80999999999995, "r_x3": 281.477, "r_y3": 270.80999999999995, "coord_origin": "TOPLEFT"}, "text": "232", "orig": "232", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 60, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 55.531, "r_y0": 283.356, "r_x1": 68.686, "r_y1": 283.356, "r_x2": 68.686, "r_y2": 279.07000000000005, "r_x3": 55.531, "r_y3": 279.07000000000005, "coord_origin": "TOPLEFT"}, "text": "WWW", "orig": "WWW", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 61, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 68.686, "r_y0": 283.047, "r_x1": 87.273, "r_y1": 283.047, "r_x2": 87.273, "r_y2": 278.40099999999995, "r_x3": 68.686, "r_y3": 278.40099999999995, "coord_origin": "TOPLEFT"}, "text": "\u304b\u3089\u53ce\u96c6\u3057\u305f\u8ad6\u6587", "orig": "\u304b\u3089\u53ce\u96c6\u3057\u305f\u8ad6\u6587", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 62, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.105, "r_y0": 282.323, "r_x1": 190.857, "r_y1": 282.323, "r_x2": 190.857, "r_y2": 278.03700000000003, "r_x3": 183.105, "r_y3": 278.03700000000003, "coord_origin": "TOPLEFT"}, "text": "107", "orig": "107", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 63, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 208.99, "r_y0": 282.323, "r_x1": 214.158, "r_y1": 282.323, "r_x2": 214.158, "r_y2": 278.03700000000003, "r_x3": 208.99, "r_y3": 278.03700000000003, "coord_origin": "TOPLEFT"}, "text": "73", "orig": "73", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 64, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 233.583, "r_y0": 282.323, "r_x1": 238.751, "r_y1": 282.323, "r_x2": 238.751, "r_y2": 278.03700000000003, "r_x3": 233.583, "r_y3": 278.03700000000003, "coord_origin": "TOPLEFT"}, "text": "34", "orig": "34", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 65, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 256.884, "r_y0": 282.323, "r_x1": 264.636, "r_y1": 282.323, "r_x2": 264.636, "r_y2": 278.03700000000003, "r_x3": 256.884, "r_y3": 278.03700000000003, "coord_origin": "TOPLEFT"}, "text": "147", "orig": "147", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 66, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 282.769, "r_y0": 282.323, "r_x1": 287.937, "r_y1": 282.323, "r_x2": 287.937, "r_y2": 278.03700000000003, "r_x3": 282.769, "r_y3": 278.03700000000003, "coord_origin": "TOPLEFT"}, "text": "96", "orig": "96", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 67, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 169.615, "r_y0": 290.274, "r_x1": 171.938, "r_y1": 290.274, "r_x2": 171.938, "r_y2": 285.628, "r_x3": 169.615, "r_y3": 285.628, "coord_origin": "TOPLEFT"}, "text": "\u8a08", "orig": "\u8a08", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 68, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.105, "r_y0": 289.809, "r_x1": 190.857, "r_y1": 289.809, "r_x2": 190.857, "r_y2": 285.522, "r_x3": 183.105, "r_y3": 285.522, "coord_origin": "TOPLEFT"}, "text": "945", "orig": "945", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 69, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 207.698, "r_y0": 289.809, "r_x1": 215.45, "r_y1": 289.809, "r_x2": 215.45, "r_y2": 285.522, "r_x3": 207.698, "r_y3": 285.522, "coord_origin": "TOPLEFT"}, "text": "294", "orig": "294", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 70, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 232.292, "r_y0": 289.809, "r_x1": 240.043, "r_y1": 289.809, "r_x2": 240.043, "r_y2": 285.522, "r_x3": 232.292, "r_y3": 285.522, "coord_origin": "TOPLEFT"}, "text": "651", "orig": "651", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 71, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 255.765, "r_y0": 289.809, "r_x1": 265.752, "r_y1": 289.809, "r_x2": 265.752, "r_y2": 285.522, "r_x3": 255.765, "r_y3": 285.522, "coord_origin": "TOPLEFT"}, "text": "1122", "orig": "1122", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 72, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 281.477, "r_y0": 289.809, "r_x1": 289.229, "r_y1": 289.809, "r_x2": 289.229, "r_y2": 285.522, "r_x3": 281.477, "r_y3": 285.522, "coord_origin": "TOPLEFT"}, "text": "955", "orig": "955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": [{"id": 55, "label": "text", "bbox": {"l": 209.933, "t": 221.35799999999995, "r": 223.873, "b": 226.00400000000002, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 209.933, "r_y0": 226.00400000000002, "r_x1": 223.873, "r_y1": 226.00400000000002, "r_x2": 223.873, "r_y2": 221.35799999999995, "r_x3": 209.933, "r_y3": 221.35799999999995, "coord_origin": "TOPLEFT"}, "text": "\u8ad6\u6587\u30d5\u30a1\u30a4\u30eb", "orig": "\u8ad6\u6587\u30d5\u30a1\u30a4\u30eb", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 56, "label": "text", "bbox": {"l": 263.765, "t": 221.35799999999995, "r": 273.058, "b": 226.00400000000002, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 263.765, "r_y0": 226.00400000000002, "r_x1": 273.058, "r_y1": 226.00400000000002, "r_x2": 273.058, "r_y2": 221.35799999999995, "r_x3": 263.765, "r_y3": 221.35799999999995, "coord_origin": "TOPLEFT"}, "text": "\u53c2\u8003\u6587\u732e", "orig": "\u53c2\u8003\u6587\u732e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 57, "label": "text", "bbox": {"l": 110.25, "t": 228.84400000000005, "r": 114.896, "b": 233.49, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 110.25, "r_y0": 233.49, "r_x1": 114.896, "r_y1": 233.49, "r_x2": 114.896, "r_y2": 228.84400000000005, "r_x3": 110.25, "r_y3": 228.84400000000005, "coord_origin": "TOPLEFT"}, "text": "\u51fa\u5178", "orig": "\u51fa\u5178", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 58, "label": "text", "bbox": {"l": 175.366, "t": 228.84400000000005, "r": 186.983, "b": 233.49, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 175.366, "r_y0": 233.49, "r_x1": 186.983, "r_y1": 233.49, "r_x2": 186.983, "r_y2": 228.84400000000005, "r_x3": 175.366, "r_y3": 228.84400000000005, "coord_origin": "TOPLEFT"}, "text": "\u30d5\u30a1\u30a4\u30eb\u6570", "orig": "\u30d5\u30a1\u30a4\u30eb\u6570", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 59, "label": "text", "bbox": {"l": 195.314, "t": 228.84400000000005, "r": 199.961, "b": 233.49, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 195.314, "r_y0": 233.49, "r_x1": 199.961, "r_y1": 233.49, "r_x2": 199.961, "r_y2": 228.84400000000005, "r_x3": 195.314, "r_y3": 228.84400000000005, "coord_origin": "TOPLEFT"}, "text": "\u82f1\u8a9e", "orig": "\u82f1\u8a9e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 60, "label": "text", "bbox": {"l": 229.198, "t": 228.84400000000005, "r": 236.168, "b": 233.49, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 229.198, "r_y0": 233.49, "r_x1": 236.168, "r_y1": 233.49, "r_x2": 236.168, "r_y2": 228.84400000000005, "r_x3": 229.198, "r_y3": 228.84400000000005, "coord_origin": "TOPLEFT"}, "text": "\u65e5\u672c\u8a9e", "orig": "\u65e5\u672c\u8a9e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 61, "label": "text", "bbox": {"l": 256.114, "t": 228.84400000000005, "r": 260.761, "b": 233.49, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 256.114, "r_y0": 233.49, "r_x1": 260.761, "r_y1": 233.49, "r_x2": 260.761, "r_y2": 228.84400000000005, "r_x3": 256.114, "r_y3": 228.84400000000005, "coord_origin": "TOPLEFT"}, "text": "\u82f1\u8a9e", "orig": "\u82f1\u8a9e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 62, "label": "text", "bbox": {"l": 278.384, "t": 228.84400000000005, "r": 285.354, "b": 233.49, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 278.384, "r_y0": 233.49, "r_x1": 285.354, "r_y1": 233.49, "r_x2": 285.354, "r_y2": 228.84400000000005, "r_x3": 278.384, "r_y3": 228.84400000000005, "coord_origin": "TOPLEFT"}, "text": "\u65e5\u672c\u8a9e", "orig": "\u65e5\u672c\u8a9e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 63, "label": "text", "bbox": {"l": 55.531, "t": 236.48199999999997, "r": 162.713, "b": 240.76800000000003, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 55.531, "r_y0": 240.76800000000003, "r_x1": 162.713, "r_y1": 240.76800000000003, "r_x2": 162.713, "r_y2": 236.48199999999997, "r_x3": 55.531, "r_y3": 236.48199999999997, "coord_origin": "TOPLEFT"}, "text": "Association for Computational Linguistics(ACL2003)", "orig": "Association for Computational Linguistics(ACL2003)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 64, "label": "text", "bbox": {"l": 184.397, "t": 236.48199999999997, "r": 189.565, "b": 240.76800000000003, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 184.397, "r_y0": 240.76800000000003, "r_x1": 189.565, "r_y1": 240.76800000000003, "r_x2": 189.565, "r_y2": 236.48199999999997, "r_x3": 184.397, "r_y3": 236.48199999999997, "coord_origin": "TOPLEFT"}, "text": "65", "orig": "65", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 65, "label": "text", "bbox": {"l": 208.99, "t": 236.48199999999997, "r": 214.158, "b": 240.76800000000003, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 208.99, "r_y0": 240.76800000000003, "r_x1": 214.158, "r_y1": 240.76800000000003, "r_x2": 214.158, "r_y2": 236.48199999999997, "r_x3": 208.99, "r_y3": 236.48199999999997, "coord_origin": "TOPLEFT"}, "text": "65", "orig": "65", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 66, "label": "text", "bbox": {"l": 234.875, "t": 236.48199999999997, "r": 237.458, "b": 240.76800000000003, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 234.875, "r_y0": 240.76800000000003, "r_x1": 237.458, "r_y1": 240.76800000000003, "r_x2": 237.458, "r_y2": 236.48199999999997, "r_x3": 234.875, "r_y3": 236.48199999999997, "coord_origin": "TOPLEFT"}, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 67, "label": "text", "bbox": {"l": 256.884, "t": 236.48199999999997, "r": 264.636, "b": 240.76800000000003, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 256.884, "r_y0": 240.76800000000003, "r_x1": 264.636, "r_y1": 240.76800000000003, "r_x2": 264.636, "r_y2": 236.48199999999997, "r_x3": 256.884, "r_y3": 236.48199999999997, "coord_origin": "TOPLEFT"}, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 68, "label": "text", "bbox": {"l": 284.061, "t": 236.48199999999997, "r": 286.644, "b": 240.76800000000003, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 284.061, "r_y0": 240.76800000000003, "r_x1": 286.644, "r_y1": 240.76800000000003, "r_x2": 286.644, "r_y2": 236.48199999999997, "r_x3": 284.061, "r_y3": 236.48199999999997, "coord_origin": "TOPLEFT"}, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 69, "label": "text", "bbox": {"l": 55.531, "t": 242.67600000000004, "r": 139.722, "b": 246.962, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 55.531, "r_y0": 246.962, "r_x1": 139.722, "r_y1": 246.962, "r_x2": 139.722, "r_y2": 242.67600000000004, "r_x3": 55.531, "r_y3": 242.67600000000004, "coord_origin": "TOPLEFT"}, "text": "Computational Linguistics(COLING2002)", "orig": "Computational Linguistics(COLING2002)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 70, "label": "text", "bbox": {"l": 183.105, "t": 242.67600000000004, "r": 190.857, "b": 246.962, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 19, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.105, "r_y0": 246.962, "r_x1": 190.857, "r_y1": 246.962, "r_x2": 190.857, "r_y2": 242.67600000000004, "r_x3": 183.105, "r_y3": 242.67600000000004, "coord_origin": "TOPLEFT"}, "text": "140", "orig": "140", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 71, "label": "text", "bbox": {"l": 207.698, "t": 242.67600000000004, "r": 215.45, "b": 246.962, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 20, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 207.698, "r_y0": 246.962, "r_x1": 215.45, "r_y1": 246.962, "r_x2": 215.45, "r_y2": 242.67600000000004, "r_x3": 207.698, "r_y3": 242.67600000000004, "coord_origin": "TOPLEFT"}, "text": "140", "orig": "140", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 72, "label": "text", "bbox": {"l": 234.875, "t": 242.67600000000004, "r": 237.458, "b": 246.962, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 21, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 234.875, "r_y0": 246.962, "r_x1": 237.458, "r_y1": 246.962, "r_x2": 237.458, "r_y2": 242.67600000000004, "r_x3": 234.875, "r_y3": 242.67600000000004, "coord_origin": "TOPLEFT"}, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 73, "label": "text", "bbox": {"l": 256.884, "t": 242.67600000000004, "r": 264.636, "b": 246.962, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 22, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 256.884, "r_y0": 246.962, "r_x1": 264.636, "r_y1": 246.962, "r_x2": 264.636, "r_y2": 242.67600000000004, "r_x3": 256.884, "r_y3": 242.67600000000004, "coord_origin": "TOPLEFT"}, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 74, "label": "text", "bbox": {"l": 284.061, "t": 242.67600000000004, "r": 286.644, "b": 246.962, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 23, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 284.061, "r_y0": 246.962, "r_x1": 286.644, "r_y1": 246.962, "r_x2": 286.644, "r_y2": 242.67600000000004, "r_x3": 284.061, "r_y3": 242.67600000000004, "coord_origin": "TOPLEFT"}, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 75, "label": "text", "bbox": {"l": 55.531, "t": 248.976, "r": 74.118, "b": 253.62199999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 24, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 55.531, "r_y0": 253.62199999999996, "r_x1": 74.118, "r_y1": 253.62199999999996, "r_x2": 74.118, "r_y2": 248.976, "r_x3": 55.531, "r_y3": 248.976, "coord_origin": "TOPLEFT"}, "text": "\u96fb\u6c17\u60c5\u5831\u901a\u4fe1\u5b66\u4f1a", "orig": "\u96fb\u6c17\u60c5\u5831\u901a\u4fe1\u5b66\u4f1a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 76, "label": "text", "bbox": {"l": 92.698, "t": 249.64499999999998, "r": 103.034, "b": 253.93100000000004, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 25, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 92.698, "r_y0": 253.93100000000004, "r_x1": 103.034, "r_y1": 253.93100000000004, "r_x2": 103.034, "r_y2": 249.64499999999998, "r_x3": 92.698, "r_y3": 249.64499999999998, "coord_origin": "TOPLEFT"}, "text": "2003", "orig": "2003", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 77, "label": "text", "bbox": {"l": 103.034, "t": 248.976, "r": 114.651, "b": 253.62199999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 26, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 103.034, "r_y0": 253.62199999999996, "r_x1": 114.651, "r_y1": 253.62199999999996, "r_x2": 114.651, "r_y2": 248.976, "r_x3": 103.034, "r_y3": 248.976, "coord_origin": "TOPLEFT"}, "text": "\u5e74\u7dcf\u5408\u5927\u4f1a", "orig": "\u5e74\u7dcf\u5408\u5927\u4f1a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 78, "label": "text", "bbox": {"l": 183.105, "t": 248.87099999999998, "r": 190.857, "b": 253.15700000000004, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 27, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.105, "r_y0": 253.15700000000004, "r_x1": 190.857, "r_y1": 253.15700000000004, "r_x2": 190.857, "r_y2": 248.87099999999998, "r_x3": 183.105, "r_y3": 248.87099999999998, "coord_origin": "TOPLEFT"}, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 79, "label": "text", "bbox": {"l": 210.282, "t": 248.87099999999998, "r": 212.865, "b": 253.15700000000004, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 28, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 210.282, "r_y0": 253.15700000000004, "r_x1": 212.865, "r_y1": 253.15700000000004, "r_x2": 212.865, "r_y2": 248.87099999999998, "r_x3": 210.282, "r_y3": 248.87099999999998, "coord_origin": "TOPLEFT"}, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 80, "label": "text", "bbox": {"l": 232.292, "t": 248.87099999999998, "r": 240.043, "b": 253.15700000000004, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 29, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 232.292, "r_y0": 253.15700000000004, "r_x1": 240.043, "r_y1": 253.15700000000004, "r_x2": 240.043, "r_y2": 248.87099999999998, "r_x3": 232.292, "r_y3": 248.87099999999998, "coord_origin": "TOPLEFT"}, "text": "142", "orig": "142", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 81, "label": "text", "bbox": {"l": 256.884, "t": 248.87099999999998, "r": 264.636, "b": 253.15700000000004, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 30, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 256.884, "r_y0": 253.15700000000004, "r_x1": 264.636, "r_y1": 253.15700000000004, "r_x2": 264.636, "r_y2": 248.87099999999998, "r_x3": 256.884, "r_y3": 248.87099999999998, "coord_origin": "TOPLEFT"}, "text": "223", "orig": "223", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 82, "label": "text", "bbox": {"l": 281.477, "t": 248.87099999999998, "r": 289.229, "b": 253.15700000000004, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 281.477, "r_y0": 253.15700000000004, "r_x1": 289.229, "r_y1": 253.15700000000004, "r_x2": 289.229, "r_y2": 248.87099999999998, "r_x3": 281.477, "r_y3": 248.87099999999998, "coord_origin": "TOPLEFT"}, "text": "147", "orig": "147", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 83, "label": "text", "bbox": {"l": 55.531, "t": 256.461, "r": 71.794, "b": 261.10699999999997, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 55.531, "r_y0": 261.10699999999997, "r_x1": 71.794, "r_y1": 261.10699999999997, "r_x2": 71.794, "r_y2": 256.461, "r_x3": 55.531, "r_y3": 256.461, "coord_origin": "TOPLEFT"}, "text": "\u60c5\u5831\u51e6\u7406\u5b66\u4f1a\u7b2c", "orig": "\u60c5\u5831\u51e6\u7406\u5b66\u4f1a\u7b2c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 84, "label": "text", "bbox": {"l": 88.053, "t": 257.13, "r": 93.22, "b": 261.41600000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 88.053, "r_y0": 261.41600000000005, "r_x1": 93.22, "r_y1": 261.41600000000005, "r_x2": 93.22, "r_y2": 257.13, "r_x3": 88.053, "r_y3": 257.13, "coord_origin": "TOPLEFT"}, "text": "65", "orig": "65", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 85, "label": "text", "bbox": {"l": 93.22, "t": 256.461, "r": 104.837, "b": 261.10699999999997, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 93.22, "r_y0": 261.10699999999997, "r_x1": 104.837, "r_y1": 261.10699999999997, "r_x2": 104.837, "r_y2": 256.461, "r_x3": 93.22, "r_y3": 256.461, "coord_origin": "TOPLEFT"}, "text": "\u56de\u5168\u56fd\u5927\u4f1a", "orig": "\u56de\u5168\u56fd\u5927\u4f1a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 86, "label": "text", "bbox": {"l": 116.451, "t": 257.13, "r": 129.882, "b": 261.41600000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 116.451, "r_y0": 261.41600000000005, "r_x1": 129.882, "r_y1": 261.41600000000005, "r_x2": 129.882, "r_y2": 257.13, "r_x3": 116.451, "r_y3": 257.13, "coord_origin": "TOPLEFT"}, "text": "(2003)", "orig": "(2003)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 87, "label": "text", "bbox": {"l": 183.105, "t": 256.356, "r": 190.857, "b": 260.64200000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.105, "r_y0": 260.64200000000005, "r_x1": 190.857, "r_y1": 260.64200000000005, "r_x2": 190.857, "r_y2": 256.356, "r_x3": 183.105, "r_y3": 256.356, "coord_origin": "TOPLEFT"}, "text": "177", "orig": "177", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 88, "label": "text", "bbox": {"l": 210.282, "t": 256.356, "r": 212.865, "b": 260.64200000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 210.282, "r_y0": 260.64200000000005, "r_x1": 212.865, "r_y1": 260.64200000000005, "r_x2": 212.865, "r_y2": 256.356, "r_x3": 210.282, "r_y3": 256.356, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 89, "label": "text", "bbox": {"l": 232.292, "t": 256.356, "r": 240.043, "b": 260.64200000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 232.292, "r_y0": 260.64200000000005, "r_x1": 240.043, "r_y1": 260.64200000000005, "r_x2": 240.043, "r_y2": 256.356, "r_x3": 232.292, "r_y3": 256.356, "coord_origin": "TOPLEFT"}, "text": "176", "orig": "176", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 90, "label": "text", "bbox": {"l": 256.884, "t": 256.356, "r": 264.636, "b": 260.64200000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 256.884, "r_y0": 260.64200000000005, "r_x1": 264.636, "r_y1": 260.64200000000005, "r_x2": 264.636, "r_y2": 256.356, "r_x3": 256.884, "r_y3": 256.356, "coord_origin": "TOPLEFT"}, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 91, "label": "text", "bbox": {"l": 281.477, "t": 256.356, "r": 289.229, "b": 260.64200000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 281.477, "r_y0": 260.64200000000005, "r_x1": 289.229, "r_y1": 260.64200000000005, "r_x2": 289.229, "r_y2": 256.356, "r_x3": 281.477, "r_y3": 256.356, "coord_origin": "TOPLEFT"}, "text": "236", "orig": "236", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 92, "label": "text", "bbox": {"l": 55.531, "t": 263.688, "r": 57.854, "b": 268.33399999999995, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 55.531, "r_y0": 268.33399999999995, "r_x1": 57.854, "r_y1": 268.33399999999995, "r_x2": 57.854, "r_y2": 263.688, "r_x3": 55.531, "r_y3": 263.688, "coord_origin": "TOPLEFT"}, "text": "\u7b2c", "orig": "\u7b2c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 93, "label": "text", "bbox": {"l": 60.177, "t": 264.35699999999997, "r": 65.344, "b": 268.644, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 60.177, "r_y0": 268.644, "r_x1": 65.344, "r_y1": 268.644, "r_x2": 65.344, "r_y2": 264.35699999999997, "r_x3": 60.177, "r_y3": 264.35699999999997, "coord_origin": "TOPLEFT"}, "text": "17", "orig": "17", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 94, "label": "text", "bbox": {"l": 65.344, "t": 263.688, "r": 90.902, "b": 268.33399999999995, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 65.344, "r_y0": 268.33399999999995, "r_x1": 90.902, "r_y1": 268.33399999999995, "r_x2": 90.902, "r_y2": 263.688, "r_x3": 65.344, "r_y3": 263.688, "coord_origin": "TOPLEFT"}, "text": "\u56de\u4eba\u5de5\u77e5\u80fd\u5b66\u4f1a\u5168\u56fd\u5927\u4f1a", "orig": "\u56de\u4eba\u5de5\u77e5\u80fd\u5b66\u4f1a\u5168\u56fd\u5927\u4f1a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 95, "label": "text", "bbox": {"l": 116.451, "t": 264.35699999999997, "r": 129.882, "b": 268.644, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 116.451, "r_y0": 268.644, "r_x1": 129.882, "r_y1": 268.644, "r_x2": 129.882, "r_y2": 264.35699999999997, "r_x3": 116.451, "r_y3": 264.35699999999997, "coord_origin": "TOPLEFT"}, "text": "(2003)", "orig": "(2003)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 96, "label": "text", "bbox": {"l": 183.105, "t": 263.58299999999997, "r": 190.857, "b": 267.869, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.105, "r_y0": 267.869, "r_x1": 190.857, "r_y1": 267.869, "r_x2": 190.857, "r_y2": 263.58299999999997, "r_x3": 183.105, "r_y3": 263.58299999999997, "coord_origin": "TOPLEFT"}, "text": "208", "orig": "208", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 97, "label": "text", "bbox": {"l": 210.282, "t": 263.58299999999997, "r": 212.865, "b": 267.869, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 210.282, "r_y0": 267.869, "r_x1": 212.865, "r_y1": 267.869, "r_x2": 212.865, "r_y2": 263.58299999999997, "r_x3": 210.282, "r_y3": 263.58299999999997, "coord_origin": "TOPLEFT"}, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 98, "label": "text", "bbox": {"l": 232.292, "t": 263.58299999999997, "r": 240.043, "b": 267.869, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 232.292, "r_y0": 267.869, "r_x1": 240.043, "r_y1": 267.869, "r_x2": 240.043, "r_y2": 263.58299999999997, "r_x3": 232.292, "r_y3": 263.58299999999997, "coord_origin": "TOPLEFT"}, "text": "203", "orig": "203", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 99, "label": "text", "bbox": {"l": 256.884, "t": 263.58299999999997, "r": 264.636, "b": 267.869, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 48, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 256.884, "r_y0": 267.869, "r_x1": 264.636, "r_y1": 267.869, "r_x2": 264.636, "r_y2": 263.58299999999997, "r_x3": 256.884, "r_y3": 263.58299999999997, "coord_origin": "TOPLEFT"}, "text": "152", "orig": "152", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 100, "label": "text", "bbox": {"l": 281.477, "t": 263.58299999999997, "r": 289.229, "b": 267.869, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 49, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 281.477, "r_y0": 267.869, "r_x1": 289.229, "r_y1": 267.869, "r_x2": 289.229, "r_y2": 263.58299999999997, "r_x3": 281.477, "r_y3": 263.58299999999997, "coord_origin": "TOPLEFT"}, "text": "244", "orig": "244", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 101, "label": "text", "bbox": {"l": 55.531, "t": 270.91600000000005, "r": 78.765, "b": 275.562, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 50, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 55.531, "r_y0": 275.562, "r_x1": 78.765, "r_y1": 275.562, "r_x2": 78.765, "r_y2": 270.91600000000005, "r_x3": 55.531, "r_y3": 270.91600000000005, "coord_origin": "TOPLEFT"}, "text": "\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u7814\u7a76\u4f1a\u7b2c", "orig": "\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u7814\u7a76\u4f1a\u7b2c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 102, "label": "text", "bbox": {"l": 101.99, "t": 271.58500000000004, "r": 109.742, "b": 275.871, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 51, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 101.99, "r_y0": 275.871, "r_x1": 109.742, "r_y1": 275.871, "r_x2": 109.742, "r_y2": 271.58500000000004, "r_x3": 101.99, "r_y3": 271.58500000000004, "coord_origin": "TOPLEFT"}, "text": "146", "orig": "146", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 103, "label": "text", "bbox": {"l": 109.742, "t": 270.91600000000005, "r": 112.065, "b": 275.562, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 52, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 109.742, "r_y0": 275.562, "r_x1": 112.065, "r_y1": 275.562, "r_x2": 112.065, "r_y2": 270.91600000000005, "r_x3": 109.742, "r_y3": 270.91600000000005, "coord_origin": "TOPLEFT"}, "text": "\u301c", "orig": "\u301c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 104, "label": "text", "bbox": {"l": 114.388, "t": 271.58500000000004, "r": 122.139, "b": 275.871, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 53, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 114.388, "r_y0": 275.871, "r_x1": 122.139, "r_y1": 275.871, "r_x2": 122.139, "r_y2": 271.58500000000004, "r_x3": 114.388, "r_y3": 271.58500000000004, "coord_origin": "TOPLEFT"}, "text": "155", "orig": "155", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 105, "label": "text", "bbox": {"l": 122.14, "t": 270.91600000000005, "r": 124.463, "b": 275.562, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 54, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 122.14, "r_y0": 275.562, "r_x1": 124.463, "r_y1": 275.562, "r_x2": 124.463, "r_y2": 270.91600000000005, "r_x3": 122.14, "r_y3": 270.91600000000005, "coord_origin": "TOPLEFT"}, "text": "\u56de", "orig": "\u56de", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 106, "label": "text", "bbox": {"l": 184.397, "t": 270.80999999999995, "r": 189.565, "b": 275.096, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 55, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 184.397, "r_y0": 275.096, "r_x1": 189.565, "r_y1": 275.096, "r_x2": 189.565, "r_y2": 270.80999999999995, "r_x3": 184.397, "r_y3": 270.80999999999995, "coord_origin": "TOPLEFT"}, "text": "98", "orig": "98", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 107, "label": "text", "bbox": {"l": 210.282, "t": 270.80999999999995, "r": 212.865, "b": 275.096, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 56, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 210.282, "r_y0": 275.096, "r_x1": 212.865, "r_y1": 275.096, "r_x2": 212.865, "r_y2": 270.80999999999995, "r_x3": 210.282, "r_y3": 270.80999999999995, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 108, "label": "text", "bbox": {"l": 233.583, "t": 270.80999999999995, "r": 238.751, "b": 275.096, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 57, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 233.583, "r_y0": 275.096, "r_x1": 238.751, "r_y1": 275.096, "r_x2": 238.751, "r_y2": 270.80999999999995, "r_x3": 233.583, "r_y3": 270.80999999999995, "coord_origin": "TOPLEFT"}, "text": "96", "orig": "96", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 109, "label": "text", "bbox": {"l": 256.884, "t": 270.80999999999995, "r": 264.636, "b": 275.096, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 58, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 256.884, "r_y0": 275.096, "r_x1": 264.636, "r_y1": 275.096, "r_x2": 264.636, "r_y2": 270.80999999999995, "r_x3": 256.884, "r_y3": 270.80999999999995, "coord_origin": "TOPLEFT"}, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 110, "label": "text", "bbox": {"l": 281.477, "t": 270.80999999999995, "r": 289.229, "b": 275.096, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 59, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 281.477, "r_y0": 275.096, "r_x1": 289.229, "r_y1": 275.096, "r_x2": 289.229, "r_y2": 270.80999999999995, "r_x3": 281.477, "r_y3": 270.80999999999995, "coord_origin": "TOPLEFT"}, "text": "232", "orig": "232", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 111, "label": "text", "bbox": {"l": 55.531, "t": 279.07000000000005, "r": 68.686, "b": 283.356, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 60, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 55.531, "r_y0": 283.356, "r_x1": 68.686, "r_y1": 283.356, "r_x2": 68.686, "r_y2": 279.07000000000005, "r_x3": 55.531, "r_y3": 279.07000000000005, "coord_origin": "TOPLEFT"}, "text": "WWW", "orig": "WWW", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 112, "label": "text", "bbox": {"l": 68.686, "t": 278.40099999999995, "r": 87.273, "b": 283.047, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 61, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 68.686, "r_y0": 283.047, "r_x1": 87.273, "r_y1": 283.047, "r_x2": 87.273, "r_y2": 278.40099999999995, "r_x3": 68.686, "r_y3": 278.40099999999995, "coord_origin": "TOPLEFT"}, "text": "\u304b\u3089\u53ce\u96c6\u3057\u305f\u8ad6\u6587", "orig": "\u304b\u3089\u53ce\u96c6\u3057\u305f\u8ad6\u6587", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 113, "label": "text", "bbox": {"l": 183.105, "t": 278.03700000000003, "r": 190.857, "b": 282.323, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 62, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.105, "r_y0": 282.323, "r_x1": 190.857, "r_y1": 282.323, "r_x2": 190.857, "r_y2": 278.03700000000003, "r_x3": 183.105, "r_y3": 278.03700000000003, "coord_origin": "TOPLEFT"}, "text": "107", "orig": "107", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 114, "label": "text", "bbox": {"l": 208.99, "t": 278.03700000000003, "r": 214.158, "b": 282.323, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 63, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 208.99, "r_y0": 282.323, "r_x1": 214.158, "r_y1": 282.323, "r_x2": 214.158, "r_y2": 278.03700000000003, "r_x3": 208.99, "r_y3": 278.03700000000003, "coord_origin": "TOPLEFT"}, "text": "73", "orig": "73", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 115, "label": "text", "bbox": {"l": 233.583, "t": 278.03700000000003, "r": 238.751, "b": 282.323, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 64, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 233.583, "r_y0": 282.323, "r_x1": 238.751, "r_y1": 282.323, "r_x2": 238.751, "r_y2": 278.03700000000003, "r_x3": 233.583, "r_y3": 278.03700000000003, "coord_origin": "TOPLEFT"}, "text": "34", "orig": "34", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 116, "label": "text", "bbox": {"l": 256.884, "t": 278.03700000000003, "r": 264.636, "b": 282.323, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 65, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 256.884, "r_y0": 282.323, "r_x1": 264.636, "r_y1": 282.323, "r_x2": 264.636, "r_y2": 278.03700000000003, "r_x3": 256.884, "r_y3": 278.03700000000003, "coord_origin": "TOPLEFT"}, "text": "147", "orig": "147", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 117, "label": "text", "bbox": {"l": 282.769, "t": 278.03700000000003, "r": 287.937, "b": 282.323, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 66, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 282.769, "r_y0": 282.323, "r_x1": 287.937, "r_y1": 282.323, "r_x2": 287.937, "r_y2": 278.03700000000003, "r_x3": 282.769, "r_y3": 278.03700000000003, "coord_origin": "TOPLEFT"}, "text": "96", "orig": "96", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 118, "label": "text", "bbox": {"l": 169.615, "t": 285.628, "r": 171.938, "b": 290.274, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 67, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 169.615, "r_y0": 290.274, "r_x1": 171.938, "r_y1": 290.274, "r_x2": 171.938, "r_y2": 285.628, "r_x3": 169.615, "r_y3": 285.628, "coord_origin": "TOPLEFT"}, "text": "\u8a08", "orig": "\u8a08", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 119, "label": "text", "bbox": {"l": 183.105, "t": 285.522, "r": 190.857, "b": 289.809, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 68, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.105, "r_y0": 289.809, "r_x1": 190.857, "r_y1": 289.809, "r_x2": 190.857, "r_y2": 285.522, "r_x3": 183.105, "r_y3": 285.522, "coord_origin": "TOPLEFT"}, "text": "945", "orig": "945", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 120, "label": "text", "bbox": {"l": 207.698, "t": 285.522, "r": 215.45, "b": 289.809, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 69, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 207.698, "r_y0": 289.809, "r_x1": 215.45, "r_y1": 289.809, "r_x2": 215.45, "r_y2": 285.522, "r_x3": 207.698, "r_y3": 285.522, "coord_origin": "TOPLEFT"}, "text": "294", "orig": "294", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 121, "label": "text", "bbox": {"l": 232.292, "t": 285.522, "r": 240.043, "b": 289.809, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 70, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 232.292, "r_y0": 289.809, "r_x1": 240.043, "r_y1": 289.809, "r_x2": 240.043, "r_y2": 285.522, "r_x3": 232.292, "r_y3": 285.522, "coord_origin": "TOPLEFT"}, "text": "651", "orig": "651", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 122, "label": "text", "bbox": {"l": 255.765, "t": 285.522, "r": 265.752, "b": 289.809, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 71, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 255.765, "r_y0": 289.809, "r_x1": 265.752, "r_y1": 289.809, "r_x2": 265.752, "r_y2": 285.522, "r_x3": 255.765, "r_y3": 285.522, "coord_origin": "TOPLEFT"}, "text": "1122", "orig": "1122", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 123, "label": "text", "bbox": {"l": 281.477, "t": 285.522, "r": 289.229, "b": 289.809, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 72, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 281.477, "r_y0": 289.809, "r_x1": 289.229, "r_y1": 289.809, "r_x2": 289.229, "r_y2": 285.522, "r_x3": 281.477, "r_y3": 285.522, "coord_origin": "TOPLEFT"}, "text": "955", "orig": "955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}]}, {"id": 16, "label": "caption", "bbox": {"l": 380.427, "t": 292.551, "r": 549.422, "b": 298.536, "coord_origin": "TOPLEFT"}, "confidence": 0.7499915957450867, "cells": [{"index": 73, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 380.427, "r_y0": 298.536, "r_x1": 549.422, "r_y1": 298.536, "r_x2": 549.422, "r_y2": 292.551, "r_x3": 380.427, "r_y3": 292.551, "coord_origin": "TOPLEFT"}, "text": "Text is aligned to match original for ease of viewing", "orig": "Text is aligned to match original for ease of viewing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 7, "label": "table", "bbox": {"l": 304.9219970703125, "t": 218.51486206054688, "r": 550.2321166992188, "b": 287.90069580078125, "coord_origin": "TOPLEFT"}, "confidence": 0.8899767994880676, "cells": [{"index": 74, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 459.049, "r_y0": 226.67100000000005, "r_x1": 542.0, "r_y1": 226.67100000000005, "r_x2": 542.0, "r_y2": 221.68899999999996, "r_x3": 459.049, "r_y3": 221.68899999999996, "coord_origin": "TOPLEFT"}, "text": "Weighted Average Grant Date Fair", "orig": "Weighted Average Grant Date Fair", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 75, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 493.822, "r_y0": 232.88099999999997, "r_x1": 507.226, "r_y1": 232.88099999999997, "r_x2": 507.226, "r_y2": 227.899, "r_x3": 493.822, "r_y3": 227.899, "coord_origin": "TOPLEFT"}, "text": "Value", "orig": "Value", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 76, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 393.244, "r_y0": 241.79399999999998, "r_x1": 407.346, "r_y1": 241.79399999999998, "r_x2": 407.346, "r_y2": 236.812, "r_x3": 393.244, "r_y3": 236.812, "coord_origin": "TOPLEFT"}, "text": "RSUs", "orig": "RSUs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 77, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 392.097, "r_y0": 226.62099999999998, "r_x1": 438.015, "r_y1": 226.62099999999998, "r_x2": 438.015, "r_y2": 221.639, "r_x3": 392.097, "r_y3": 221.639, "coord_origin": "TOPLEFT"}, "text": "Shares (in millions)", "orig": "Shares (in millions)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 78, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 427.183, "r_y0": 241.79399999999998, "r_x1": 440.988, "r_y1": 241.79399999999998, "r_x2": 440.988, "r_y2": 236.812, "r_x3": 427.183, "r_y3": 236.812, "coord_origin": "TOPLEFT"}, "text": "PSUs", "orig": "PSUs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 79, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 468.383, "r_y0": 241.79399999999998, "r_x1": 482.485, "r_y1": 241.79399999999998, "r_x2": 482.485, "r_y2": 236.812, "r_x3": 468.383, "r_y3": 236.812, "coord_origin": "TOPLEFT"}, "text": "RSUs", "orig": "RSUs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 80, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 516.926, "r_y0": 241.79399999999998, "r_x1": 530.73, "r_y1": 241.79399999999998, "r_x2": 530.73, "r_y2": 236.812, "r_x3": 516.926, "r_y3": 236.812, "coord_origin": "TOPLEFT"}, "text": "PSUs", "orig": "PSUs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 81, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 306.115, "r_y0": 249.65700000000004, "r_x1": 364.656, "r_y1": 249.65700000000004, "r_x2": 364.656, "r_y2": 244.67600000000004, "r_x3": 306.115, "r_y3": 244.67600000000004, "coord_origin": "TOPLEFT"}, "text": "Nonvested on January 1", "orig": "Nonvested on January 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 82, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 396.247, "r_y0": 249.96000000000004, "r_x1": 403.755, "r_y1": 249.96000000000004, "r_x2": 403.755, "r_y2": 244.97799999999995, "r_x3": 396.247, "r_y3": 244.97799999999995, "coord_origin": "TOPLEFT"}, "text": "1.1", "orig": "1.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 83, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 429.818, "r_y0": 249.96000000000004, "r_x1": 437.327, "r_y1": 249.96000000000004, "r_x2": 437.327, "r_y2": 244.97799999999995, "r_x3": 429.818, "r_y3": 244.97799999999995, "coord_origin": "TOPLEFT"}, "text": "0.3", "orig": "0.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 84, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 465.529, "r_y0": 249.96000000000004, "r_x1": 483.55, "r_y1": 249.96000000000004, "r_x2": 483.55, "r_y2": 244.97799999999995, "r_x3": 465.529, "r_y3": 244.97799999999995, "coord_origin": "TOPLEFT"}, "text": "90.10 $", "orig": "90.10 $", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 85, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 513.448, "r_y0": 249.96000000000004, "r_x1": 531.47, "r_y1": 249.96000000000004, "r_x2": 531.47, "r_y2": 244.97799999999995, "r_x3": 513.448, "r_y3": 244.97799999999995, "coord_origin": "TOPLEFT"}, "text": "$ 91.19", "orig": "$ 91.19", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 86, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 306.115, "r_y0": 258.731, "r_x1": 325.627, "r_y1": 258.731, "r_x2": 325.627, "r_y2": 253.74900000000002, "r_x3": 306.115, "r_y3": 253.74900000000002, "coord_origin": "TOPLEFT"}, "text": "Granted", "orig": "Granted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 87, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 396.247, "r_y0": 258.731, "r_x1": 403.755, "r_y1": 258.731, "r_x2": 403.755, "r_y2": 253.74900000000002, "r_x3": 396.247, "r_y3": 253.74900000000002, "coord_origin": "TOPLEFT"}, "text": "0.5", "orig": "0.5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 88, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 429.818, "r_y0": 258.731, "r_x1": 437.327, "r_y1": 258.731, "r_x2": 437.327, "r_y2": 253.74900000000002, "r_x3": 429.818, "r_y3": 253.74900000000002, "coord_origin": "TOPLEFT"}, "text": "0.1", "orig": "0.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 89, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 466.436, "r_y0": 258.731, "r_x1": 482.548, "r_y1": 258.731, "r_x2": 482.548, "r_y2": 253.74900000000002, "r_x3": 466.436, "r_y3": 253.74900000000002, "coord_origin": "TOPLEFT"}, "text": "117.44", "orig": "117.44", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 90, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 514.291, "r_y0": 258.731, "r_x1": 530.81, "r_y1": 258.731, "r_x2": 530.81, "r_y2": 253.74900000000002, "r_x3": 514.291, "r_y3": 253.74900000000002, "coord_origin": "TOPLEFT"}, "text": "122.41", "orig": "122.41", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 91, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 306.115, "r_y0": 266.595, "r_x1": 322.629, "r_y1": 266.595, "r_x2": 322.629, "r_y2": 261.61300000000006, "r_x3": 306.115, "r_y3": 261.61300000000006, "coord_origin": "TOPLEFT"}, "text": "Vested", "orig": "Vested", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 92, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.432, "r_y0": 266.595, "r_x1": 405.536, "r_y1": 266.595, "r_x2": 405.536, "r_y2": 261.61300000000006, "r_x3": 394.432, "r_y3": 261.61300000000006, "coord_origin": "TOPLEFT"}, "text": "(0.5)", "orig": "(0.5)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 93, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 427.702, "r_y0": 266.595, "r_x1": 438.806, "r_y1": 266.595, "r_x2": 438.806, "r_y2": 261.61300000000006, "r_x3": 427.702, "r_y3": 261.61300000000006, "coord_origin": "TOPLEFT"}, "text": "(0.1)", "orig": "(0.1)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 94, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 468.555, "r_y0": 266.595, "r_x1": 482.07, "r_y1": 266.595, "r_x2": 482.07, "r_y2": 261.61300000000006, "r_x3": 468.555, "r_y3": 261.61300000000006, "coord_origin": "TOPLEFT"}, "text": "87.08", "orig": "87.08", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 95, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 516.019, "r_y0": 266.595, "r_x1": 529.534, "r_y1": 266.595, "r_x2": 529.534, "r_y2": 261.61300000000006, "r_x3": 516.019, "r_y3": 261.61300000000006, "coord_origin": "TOPLEFT"}, "text": "81.14", "orig": "81.14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 96, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 306.115, "r_y0": 274.688, "r_x1": 356.248, "r_y1": 274.688, "r_x2": 356.248, "r_y2": 269.706, "r_x3": 306.115, "r_y3": 269.706, "coord_origin": "TOPLEFT"}, "text": "Canceled or forfeited", "orig": "Canceled or forfeited", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 97, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.432, "r_y0": 275.366, "r_x1": 405.536, "r_y1": 275.366, "r_x2": 405.536, "r_y2": 270.384, "r_x3": 394.432, "r_y3": 270.384, "coord_origin": "TOPLEFT"}, "text": "(0.1)", "orig": "(0.1)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 98, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 431.028, "r_y0": 275.366, "r_x1": 436.428, "r_y1": 275.366, "r_x2": 436.428, "r_y2": 270.384, "r_x3": 431.028, "r_y3": 270.384, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 99, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 465.831, "r_y0": 275.366, "r_x1": 482.35, "r_y1": 275.366, "r_x2": 482.35, "r_y2": 270.384, "r_x3": 465.831, "r_y3": 270.384, "coord_origin": "TOPLEFT"}, "text": "102.01", "orig": "102.01", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 100, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 516.019, "r_y0": 275.366, "r_x1": 529.534, "r_y1": 275.366, "r_x2": 529.534, "r_y2": 270.384, "r_x3": 516.019, "r_y3": 270.384, "coord_origin": "TOPLEFT"}, "text": "92.18", "orig": "92.18", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 101, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 306.115, "r_y0": 283.532, "r_x1": 373.358, "r_y1": 283.532, "r_x2": 373.358, "r_y2": 278.55100000000004, "r_x3": 306.115, "r_y3": 278.55100000000004, "coord_origin": "TOPLEFT"}, "text": "Nonvested on December 31", "orig": "Nonvested on December 31", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 102, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 396.247, "r_y0": 283.532, "r_x1": 403.755, "r_y1": 283.532, "r_x2": 403.755, "r_y2": 278.55100000000004, "r_x3": 396.247, "r_y3": 278.55100000000004, "coord_origin": "TOPLEFT"}, "text": "1.0", "orig": "1.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 103, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 429.516, "r_y0": 283.532, "r_x1": 437.025, "r_y1": 283.532, "r_x2": 437.025, "r_y2": 278.55100000000004, "r_x3": 429.516, "r_y3": 278.55100000000004, "coord_origin": "TOPLEFT"}, "text": "0.3", "orig": "0.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 104, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 463.714, "r_y0": 283.532, "r_x1": 484.74, "r_y1": 283.532, "r_x2": 484.74, "r_y2": 278.55100000000004, "r_x3": 463.714, "r_y3": 278.55100000000004, "coord_origin": "TOPLEFT"}, "text": "104.85 $", "orig": "104.85 $", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 105, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 512.995, "r_y0": 283.532, "r_x1": 534.02, "r_y1": 283.532, "r_x2": 534.02, "r_y2": 278.55100000000004, "r_x3": 512.995, "r_y3": 278.55100000000004, "coord_origin": "TOPLEFT"}, "text": "$ 104.51", "orig": "$ 104.51", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": [{"id": 124, "label": "text", "bbox": {"l": 459.049, "t": 221.68899999999996, "r": 542.0, "b": 226.67100000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 74, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 459.049, "r_y0": 226.67100000000005, "r_x1": 542.0, "r_y1": 226.67100000000005, "r_x2": 542.0, "r_y2": 221.68899999999996, "r_x3": 459.049, "r_y3": 221.68899999999996, "coord_origin": "TOPLEFT"}, "text": "Weighted Average Grant Date Fair", "orig": "Weighted Average Grant Date Fair", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 125, "label": "text", "bbox": {"l": 493.822, "t": 227.899, "r": 507.226, "b": 232.88099999999997, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 75, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 493.822, "r_y0": 232.88099999999997, "r_x1": 507.226, "r_y1": 232.88099999999997, "r_x2": 507.226, "r_y2": 227.899, "r_x3": 493.822, "r_y3": 227.899, "coord_origin": "TOPLEFT"}, "text": "Value", "orig": "Value", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 126, "label": "text", "bbox": {"l": 393.244, "t": 236.812, "r": 407.346, "b": 241.79399999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 76, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 393.244, "r_y0": 241.79399999999998, "r_x1": 407.346, "r_y1": 241.79399999999998, "r_x2": 407.346, "r_y2": 236.812, "r_x3": 393.244, "r_y3": 236.812, "coord_origin": "TOPLEFT"}, "text": "RSUs", "orig": "RSUs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 127, "label": "text", "bbox": {"l": 392.097, "t": 221.639, "r": 438.015, "b": 226.62099999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 77, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 392.097, "r_y0": 226.62099999999998, "r_x1": 438.015, "r_y1": 226.62099999999998, "r_x2": 438.015, "r_y2": 221.639, "r_x3": 392.097, "r_y3": 221.639, "coord_origin": "TOPLEFT"}, "text": "Shares (in millions)", "orig": "Shares (in millions)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 128, "label": "text", "bbox": {"l": 427.183, "t": 236.812, "r": 440.988, "b": 241.79399999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 78, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 427.183, "r_y0": 241.79399999999998, "r_x1": 440.988, "r_y1": 241.79399999999998, "r_x2": 440.988, "r_y2": 236.812, "r_x3": 427.183, "r_y3": 236.812, "coord_origin": "TOPLEFT"}, "text": "PSUs", "orig": "PSUs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 129, "label": "text", "bbox": {"l": 468.383, "t": 236.812, "r": 482.485, "b": 241.79399999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 79, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 468.383, "r_y0": 241.79399999999998, "r_x1": 482.485, "r_y1": 241.79399999999998, "r_x2": 482.485, "r_y2": 236.812, "r_x3": 468.383, "r_y3": 236.812, "coord_origin": "TOPLEFT"}, "text": "RSUs", "orig": "RSUs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 130, "label": "text", "bbox": {"l": 516.926, "t": 236.812, "r": 530.73, "b": 241.79399999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 80, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 516.926, "r_y0": 241.79399999999998, "r_x1": 530.73, "r_y1": 241.79399999999998, "r_x2": 530.73, "r_y2": 236.812, "r_x3": 516.926, "r_y3": 236.812, "coord_origin": "TOPLEFT"}, "text": "PSUs", "orig": "PSUs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 131, "label": "text", "bbox": {"l": 306.115, "t": 244.67600000000004, "r": 364.656, "b": 249.65700000000004, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 81, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 306.115, "r_y0": 249.65700000000004, "r_x1": 364.656, "r_y1": 249.65700000000004, "r_x2": 364.656, "r_y2": 244.67600000000004, "r_x3": 306.115, "r_y3": 244.67600000000004, "coord_origin": "TOPLEFT"}, "text": "Nonvested on January 1", "orig": "Nonvested on January 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 132, "label": "text", "bbox": {"l": 396.247, "t": 244.97799999999995, "r": 403.755, "b": 249.96000000000004, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 82, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 396.247, "r_y0": 249.96000000000004, "r_x1": 403.755, "r_y1": 249.96000000000004, "r_x2": 403.755, "r_y2": 244.97799999999995, "r_x3": 396.247, "r_y3": 244.97799999999995, "coord_origin": "TOPLEFT"}, "text": "1.1", "orig": "1.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 133, "label": "text", "bbox": {"l": 429.818, "t": 244.97799999999995, "r": 437.327, "b": 249.96000000000004, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 83, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 429.818, "r_y0": 249.96000000000004, "r_x1": 437.327, "r_y1": 249.96000000000004, "r_x2": 437.327, "r_y2": 244.97799999999995, "r_x3": 429.818, "r_y3": 244.97799999999995, "coord_origin": "TOPLEFT"}, "text": "0.3", "orig": "0.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 134, "label": "text", "bbox": {"l": 465.529, "t": 244.97799999999995, "r": 483.55, "b": 249.96000000000004, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 84, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 465.529, "r_y0": 249.96000000000004, "r_x1": 483.55, "r_y1": 249.96000000000004, "r_x2": 483.55, "r_y2": 244.97799999999995, "r_x3": 465.529, "r_y3": 244.97799999999995, "coord_origin": "TOPLEFT"}, "text": "90.10 $", "orig": "90.10 $", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 135, "label": "text", "bbox": {"l": 513.448, "t": 244.97799999999995, "r": 531.47, "b": 249.96000000000004, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 85, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 513.448, "r_y0": 249.96000000000004, "r_x1": 531.47, "r_y1": 249.96000000000004, "r_x2": 531.47, "r_y2": 244.97799999999995, "r_x3": 513.448, "r_y3": 244.97799999999995, "coord_origin": "TOPLEFT"}, "text": "$ 91.19", "orig": "$ 91.19", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 136, "label": "text", "bbox": {"l": 306.115, "t": 253.74900000000002, "r": 325.627, "b": 258.731, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 86, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 306.115, "r_y0": 258.731, "r_x1": 325.627, "r_y1": 258.731, "r_x2": 325.627, "r_y2": 253.74900000000002, "r_x3": 306.115, "r_y3": 253.74900000000002, "coord_origin": "TOPLEFT"}, "text": "Granted", "orig": "Granted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 137, "label": "text", "bbox": {"l": 396.247, "t": 253.74900000000002, "r": 403.755, "b": 258.731, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 87, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 396.247, "r_y0": 258.731, "r_x1": 403.755, "r_y1": 258.731, "r_x2": 403.755, "r_y2": 253.74900000000002, "r_x3": 396.247, "r_y3": 253.74900000000002, "coord_origin": "TOPLEFT"}, "text": "0.5", "orig": "0.5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 138, "label": "text", "bbox": {"l": 429.818, "t": 253.74900000000002, "r": 437.327, "b": 258.731, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 88, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 429.818, "r_y0": 258.731, "r_x1": 437.327, "r_y1": 258.731, "r_x2": 437.327, "r_y2": 253.74900000000002, "r_x3": 429.818, "r_y3": 253.74900000000002, "coord_origin": "TOPLEFT"}, "text": "0.1", "orig": "0.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 139, "label": "text", "bbox": {"l": 466.436, "t": 253.74900000000002, "r": 482.548, "b": 258.731, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 89, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 466.436, "r_y0": 258.731, "r_x1": 482.548, "r_y1": 258.731, "r_x2": 482.548, "r_y2": 253.74900000000002, "r_x3": 466.436, "r_y3": 253.74900000000002, "coord_origin": "TOPLEFT"}, "text": "117.44", "orig": "117.44", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 140, "label": "text", "bbox": {"l": 514.291, "t": 253.74900000000002, "r": 530.81, "b": 258.731, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 90, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 514.291, "r_y0": 258.731, "r_x1": 530.81, "r_y1": 258.731, "r_x2": 530.81, "r_y2": 253.74900000000002, "r_x3": 514.291, "r_y3": 253.74900000000002, "coord_origin": "TOPLEFT"}, "text": "122.41", "orig": "122.41", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 141, "label": "text", "bbox": {"l": 306.115, "t": 261.61300000000006, "r": 322.629, "b": 266.595, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 91, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 306.115, "r_y0": 266.595, "r_x1": 322.629, "r_y1": 266.595, "r_x2": 322.629, "r_y2": 261.61300000000006, "r_x3": 306.115, "r_y3": 261.61300000000006, "coord_origin": "TOPLEFT"}, "text": "Vested", "orig": "Vested", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 142, "label": "text", "bbox": {"l": 394.432, "t": 261.61300000000006, "r": 405.536, "b": 266.595, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 92, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.432, "r_y0": 266.595, "r_x1": 405.536, "r_y1": 266.595, "r_x2": 405.536, "r_y2": 261.61300000000006, "r_x3": 394.432, "r_y3": 261.61300000000006, "coord_origin": "TOPLEFT"}, "text": "(0.5)", "orig": "(0.5)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 143, "label": "text", "bbox": {"l": 427.702, "t": 261.61300000000006, "r": 438.806, "b": 266.595, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 93, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 427.702, "r_y0": 266.595, "r_x1": 438.806, "r_y1": 266.595, "r_x2": 438.806, "r_y2": 261.61300000000006, "r_x3": 427.702, "r_y3": 261.61300000000006, "coord_origin": "TOPLEFT"}, "text": "(0.1)", "orig": "(0.1)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 144, "label": "text", "bbox": {"l": 468.555, "t": 261.61300000000006, "r": 482.07, "b": 266.595, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 94, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 468.555, "r_y0": 266.595, "r_x1": 482.07, "r_y1": 266.595, "r_x2": 482.07, "r_y2": 261.61300000000006, "r_x3": 468.555, "r_y3": 261.61300000000006, "coord_origin": "TOPLEFT"}, "text": "87.08", "orig": "87.08", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 145, "label": "text", "bbox": {"l": 516.019, "t": 261.61300000000006, "r": 529.534, "b": 266.595, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 95, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 516.019, "r_y0": 266.595, "r_x1": 529.534, "r_y1": 266.595, "r_x2": 529.534, "r_y2": 261.61300000000006, "r_x3": 516.019, "r_y3": 261.61300000000006, "coord_origin": "TOPLEFT"}, "text": "81.14", "orig": "81.14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 146, "label": "text", "bbox": {"l": 306.115, "t": 269.706, "r": 356.248, "b": 274.688, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 96, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 306.115, "r_y0": 274.688, "r_x1": 356.248, "r_y1": 274.688, "r_x2": 356.248, "r_y2": 269.706, "r_x3": 306.115, "r_y3": 269.706, "coord_origin": "TOPLEFT"}, "text": "Canceled or forfeited", "orig": "Canceled or forfeited", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 147, "label": "text", "bbox": {"l": 394.432, "t": 270.384, "r": 405.536, "b": 275.366, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 97, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.432, "r_y0": 275.366, "r_x1": 405.536, "r_y1": 275.366, "r_x2": 405.536, "r_y2": 270.384, "r_x3": 394.432, "r_y3": 270.384, "coord_origin": "TOPLEFT"}, "text": "(0.1)", "orig": "(0.1)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 148, "label": "text", "bbox": {"l": 431.028, "t": 270.384, "r": 436.428, "b": 275.366, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 98, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 431.028, "r_y0": 275.366, "r_x1": 436.428, "r_y1": 275.366, "r_x2": 436.428, "r_y2": 270.384, "r_x3": 431.028, "r_y3": 270.384, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 149, "label": "text", "bbox": {"l": 465.831, "t": 270.384, "r": 482.35, "b": 275.366, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 99, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 465.831, "r_y0": 275.366, "r_x1": 482.35, "r_y1": 275.366, "r_x2": 482.35, "r_y2": 270.384, "r_x3": 465.831, "r_y3": 270.384, "coord_origin": "TOPLEFT"}, "text": "102.01", "orig": "102.01", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 150, "label": "text", "bbox": {"l": 516.019, "t": 270.384, "r": 529.534, "b": 275.366, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 100, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 516.019, "r_y0": 275.366, "r_x1": 529.534, "r_y1": 275.366, "r_x2": 529.534, "r_y2": 270.384, "r_x3": 516.019, "r_y3": 270.384, "coord_origin": "TOPLEFT"}, "text": "92.18", "orig": "92.18", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 151, "label": "text", "bbox": {"l": 306.115, "t": 278.55100000000004, "r": 373.358, "b": 283.532, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 101, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 306.115, "r_y0": 283.532, "r_x1": 373.358, "r_y1": 283.532, "r_x2": 373.358, "r_y2": 278.55100000000004, "r_x3": 306.115, "r_y3": 278.55100000000004, "coord_origin": "TOPLEFT"}, "text": "Nonvested on December 31", "orig": "Nonvested on December 31", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 152, "label": "text", "bbox": {"l": 396.247, "t": 278.55100000000004, "r": 403.755, "b": 283.532, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 102, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 396.247, "r_y0": 283.532, "r_x1": 403.755, "r_y1": 283.532, "r_x2": 403.755, "r_y2": 278.55100000000004, "r_x3": 396.247, "r_y3": 278.55100000000004, "coord_origin": "TOPLEFT"}, "text": "1.0", "orig": "1.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 153, "label": "text", "bbox": {"l": 429.516, "t": 278.55100000000004, "r": 437.025, "b": 283.532, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 103, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 429.516, "r_y0": 283.532, "r_x1": 437.025, "r_y1": 283.532, "r_x2": 437.025, "r_y2": 278.55100000000004, "r_x3": 429.516, "r_y3": 278.55100000000004, "coord_origin": "TOPLEFT"}, "text": "0.3", "orig": "0.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 154, "label": "text", "bbox": {"l": 463.714, "t": 278.55100000000004, "r": 484.74, "b": 283.532, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 104, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 463.714, "r_y0": 283.532, "r_x1": 484.74, "r_y1": 283.532, "r_x2": 484.74, "r_y2": 278.55100000000004, "r_x3": 463.714, "r_y3": 278.55100000000004, "coord_origin": "TOPLEFT"}, "text": "104.85 $", "orig": "104.85 $", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 155, "label": "text", "bbox": {"l": 512.995, "t": 278.55100000000004, "r": 534.02, "b": 283.532, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 105, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 512.995, "r_y0": 283.532, "r_x1": 534.02, "r_y1": 283.532, "r_x2": 534.02, "r_y2": 278.55100000000004, "r_x3": 512.995, "r_y3": 278.55100000000004, "coord_origin": "TOPLEFT"}, "text": "$ 104.51", "orig": "$ 104.51", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}]}, {"id": 6, "label": "caption", "bbox": {"l": 50.112, "t": 321.146, "r": 545.114, "b": 365.564, "coord_origin": "TOPLEFT"}, "confidence": 0.9140303134918213, "cells": [{"index": 106, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 329.698, "r_x1": 86.864, "r_y1": 329.698, "r_x2": 86.864, "r_y2": 321.146, "r_x3": 50.112, "r_y3": 321.146, "coord_origin": "TOPLEFT"}, "text": "Figure 5:", "orig": "Figure 5:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 107, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 93.918, "r_y0": 329.698, "r_x1": 545.114, "r_y1": 329.698, "r_x2": 545.114, "r_y2": 321.146, "r_x3": 93.918, "r_y3": 321.146, "coord_origin": "TOPLEFT"}, "text": "One of the benefits of TableFormer is that it is language agnostic, as an example, the left part of the illustration", "orig": "One of the benefits of TableFormer is that it is language agnostic, as an example, the left part of the illustration", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 108, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 341.653, "r_x1": 545.114, "r_y1": 341.653, "r_x2": 545.114, "r_y2": 333.101, "r_x3": 50.112, "r_y3": 333.101, "coord_origin": "TOPLEFT"}, "text": "demonstrates TableFormer predictions on previously unseen language (Japanese). Additionally, we see that TableFormer is", "orig": "demonstrates TableFormer predictions on previously unseen language (Japanese). Additionally, we see that TableFormer is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 109, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 353.608, "r_x1": 545.114, "r_y1": 353.608, "r_x2": 545.114, "r_y2": 345.056, "r_x3": 50.112, "r_y3": 345.056, "coord_origin": "TOPLEFT"}, "text": "robust to variability in style and content, right side of the illustration shows the example of the TableFormer prediction from", "orig": "robust to variability in style and content, right side of the illustration shows the example of the TableFormer prediction from", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 110, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 365.564, "r_x1": 139.795, "r_y1": 365.564, "r_x2": 139.795, "r_y2": 357.012, "r_x3": 50.112, "r_y3": 357.012, "coord_origin": "TOPLEFT"}, "text": "the FinTabNet dataset.", "orig": "the FinTabNet dataset.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 12, "label": "picture", "bbox": {"l": 216.76925659179688, "t": 380.4906311035156, "r": 375.7829284667969, "b": 443.34698486328125, "coord_origin": "TOPLEFT"}, "confidence": 0.805853009223938, "cells": [{"index": 111, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 220.263, "r_y0": 386.393, "r_x1": 342.078, "r_y1": 386.393, "r_x2": 342.078, "r_y2": 381.96, "r_x3": 220.263, "r_y3": 381.96, "coord_origin": "TOPLEFT"}, "text": "Red - PDF cells, Green - predicted bounding boxes", "orig": "Red - PDF cells, Green - predicted bounding boxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": [{"id": 156, "label": "text", "bbox": {"l": 220.263, "t": 381.96, "r": 342.078, "b": 386.393, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 111, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 220.263, "r_y0": 386.393, "r_x1": 342.078, "r_y1": 386.393, "r_x2": 342.078, "r_y2": 381.96, "r_x3": 220.263, "r_y3": 381.96, "coord_origin": "TOPLEFT"}, "text": "Red - PDF cells, Green - predicted bounding boxes", "orig": "Red - PDF cells, Green - predicted bounding boxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}]}, {"id": 11, "label": "picture", "bbox": {"l": 51.736167907714844, "t": 380.48065185546875, "r": 211.83778381347656, "b": 443.6580810546875, "coord_origin": "TOPLEFT"}, "confidence": 0.8308426737785339, "cells": [{"index": 112, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 53.715, "r_y0": 386.393, "r_x1": 85.657, "r_y1": 386.393, "r_x2": 85.657, "r_y2": 381.96, "r_x3": 53.715, "r_y3": 381.96, "coord_origin": "TOPLEFT"}, "text": "Ground Truth", "orig": "Ground Truth", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": [{"id": 157, "label": "text", "bbox": {"l": 53.715, "t": 381.96, "r": 85.657, "b": 386.393, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 112, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 53.715, "r_y0": 386.393, "r_x1": 85.657, "r_y1": 386.393, "r_x2": 85.657, "r_y2": 381.96, "r_x3": 53.715, "r_y3": 381.96, "coord_origin": "TOPLEFT"}, "text": "Ground Truth", "orig": "Ground Truth", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}]}, {"id": 13, "label": "picture", "bbox": {"l": 383.1364440917969, "t": 381.2313232421875, "r": 542.1132202148438, "b": 442.7749328613281, "coord_origin": "TOPLEFT"}, "confidence": 0.7881615161895752, "cells": [{"index": 113, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 437.379, "r_y0": 406.686, "r_x1": 443.699, "r_y1": 406.686, "r_x2": 443.699, "r_y2": 401.109, "r_x3": 437.379, "r_y3": 401.109, "coord_origin": "TOPLEFT"}, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 114, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 450.332, "r_y0": 406.686, "r_x1": 456.651, "r_y1": 406.686, "r_x2": 456.651, "r_y2": 401.109, "r_x3": 450.332, "r_y3": 401.109, "coord_origin": "TOPLEFT"}, "text": "17", "orig": "17", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 115, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 463.285, "r_y0": 406.686, "r_x1": 469.604, "r_y1": 406.686, "r_x2": 469.604, "r_y2": 401.109, "r_x3": 463.285, "r_y3": 401.109, "coord_origin": "TOPLEFT"}, "text": "18", "orig": "18", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 116, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 476.237, "r_y0": 406.686, "r_x1": 482.557, "r_y1": 406.686, "r_x2": 482.557, "r_y2": 401.109, "r_x3": 476.237, "r_y3": 401.109, "coord_origin": "TOPLEFT"}, "text": "19", "orig": "19", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 117, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 489.19, "r_y0": 406.686, "r_x1": 495.509, "r_y1": 406.686, "r_x2": 495.509, "r_y2": 401.109, "r_x3": 489.19, "r_y3": 401.109, "coord_origin": "TOPLEFT"}, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 118, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 502.143, "r_y0": 406.686, "r_x1": 508.462, "r_y1": 406.686, "r_x2": 508.462, "r_y2": 401.109, "r_x3": 502.143, "r_y3": 401.109, "coord_origin": "TOPLEFT"}, "text": "21", "orig": "21", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 119, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 515.095, "r_y0": 406.686, "r_x1": 521.414, "r_y1": 406.686, "r_x2": 521.414, "r_y2": 401.109, "r_x3": 515.095, "r_y3": 401.109, "coord_origin": "TOPLEFT"}, "text": "22", "orig": "22", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 120, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 385.281, "r_y0": 417.172, "r_x1": 391.601, "r_y1": 417.172, "r_x2": 391.601, "r_y2": 411.594, "r_x3": 385.281, "r_y3": 411.594, "coord_origin": "TOPLEFT"}, "text": "23", "orig": "23", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 121, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 398.523, "r_y0": 417.172, "r_x1": 404.843, "r_y1": 417.172, "r_x2": 404.843, "r_y2": 411.594, "r_x3": 398.523, "r_y3": 411.594, "coord_origin": "TOPLEFT"}, "text": "24", "orig": "24", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 122, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 411.476, "r_y0": 417.172, "r_x1": 417.795, "r_y1": 417.172, "r_x2": 417.795, "r_y2": 411.594, "r_x3": 411.476, "r_y3": 411.594, "coord_origin": "TOPLEFT"}, "text": "25", "orig": "25", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 123, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 437.379, "r_y0": 417.172, "r_x1": 443.699, "r_y1": 417.172, "r_x2": 443.699, "r_y2": 411.594, "r_x3": 437.379, "r_y3": 411.594, "coord_origin": "TOPLEFT"}, "text": "26", "orig": "26", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 124, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 450.332, "r_y0": 417.172, "r_x1": 456.651, "r_y1": 417.172, "r_x2": 456.651, "r_y2": 411.594, "r_x3": 450.332, "r_y3": 411.594, "coord_origin": "TOPLEFT"}, "text": "27", "orig": "27", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 125, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 463.285, "r_y0": 417.172, "r_x1": 469.604, "r_y1": 417.172, "r_x2": 469.604, "r_y2": 411.594, "r_x3": 463.285, "r_y3": 411.594, "coord_origin": "TOPLEFT"}, "text": "28", "orig": "28", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 126, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 385.281, "r_y0": 427.203, "r_x1": 391.601, "r_y1": 427.203, "r_x2": 391.601, "r_y2": 421.626, "r_x3": 385.281, "r_y3": 421.626, "coord_origin": "TOPLEFT"}, "text": "30", "orig": "30", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 127, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 398.523, "r_y0": 427.203, "r_x1": 404.843, "r_y1": 427.203, "r_x2": 404.843, "r_y2": 421.626, "r_x3": 398.523, "r_y3": 421.626, "coord_origin": "TOPLEFT"}, "text": "31", "orig": "31", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 128, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 411.476, "r_y0": 427.203, "r_x1": 417.795, "r_y1": 427.203, "r_x2": 417.795, "r_y2": 421.626, "r_x3": 411.476, "r_y3": 421.626, "coord_origin": "TOPLEFT"}, "text": "32", "orig": "32", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 129, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 424.429, "r_y0": 427.203, "r_x1": 430.748, "r_y1": 427.203, "r_x2": 430.748, "r_y2": 421.626, "r_x3": 424.429, "r_y3": 421.626, "coord_origin": "TOPLEFT"}, "text": "33", "orig": "33", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 130, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 437.381, "r_y0": 427.203, "r_x1": 443.701, "r_y1": 427.203, "r_x2": 443.701, "r_y2": 421.626, "r_x3": 437.381, "r_y3": 421.626, "coord_origin": "TOPLEFT"}, "text": "34", "orig": "34", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 131, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 450.334, "r_y0": 427.203, "r_x1": 456.653, "r_y1": 427.203, "r_x2": 456.653, "r_y2": 421.626, "r_x3": 450.334, "r_y3": 421.626, "coord_origin": "TOPLEFT"}, "text": "35", "orig": "35", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 132, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 463.287, "r_y0": 427.203, "r_x1": 469.606, "r_y1": 427.203, "r_x2": 469.606, "r_y2": 421.626, "r_x3": 463.287, "r_y3": 421.626, "coord_origin": "TOPLEFT"}, "text": "36", "orig": "36", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 133, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 476.239, "r_y0": 427.203, "r_x1": 482.558, "r_y1": 427.203, "r_x2": 482.558, "r_y2": 421.626, "r_x3": 476.239, "r_y3": 421.626, "coord_origin": "TOPLEFT"}, "text": "37", "orig": "37", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 134, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 489.192, "r_y0": 427.203, "r_x1": 495.511, "r_y1": 427.203, "r_x2": 495.511, "r_y2": 421.626, "r_x3": 489.192, "r_y3": 421.626, "coord_origin": "TOPLEFT"}, "text": "38", "orig": "38", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 135, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 502.144, "r_y0": 427.203, "r_x1": 508.464, "r_y1": 427.203, "r_x2": 508.464, "r_y2": 421.626, "r_x3": 502.144, "r_y3": 421.626, "coord_origin": "TOPLEFT"}, "text": "39", "orig": "39", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 136, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 515.097, "r_y0": 427.203, "r_x1": 521.416, "r_y1": 427.203, "r_x2": 521.416, "r_y2": 421.626, "r_x3": 515.097, "r_y3": 421.626, "coord_origin": "TOPLEFT"}, "text": "40", "orig": "40", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 137, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 528.05, "r_y0": 427.203, "r_x1": 534.369, "r_y1": 427.203, "r_x2": 534.369, "r_y2": 421.626, "r_x3": 528.05, "r_y3": 421.626, "coord_origin": "TOPLEFT"}, "text": "41", "orig": "41", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 138, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 385.281, "r_y0": 438.178, "r_x1": 391.601, "r_y1": 438.178, "r_x2": 391.601, "r_y2": 432.6, "r_x3": 385.281, "r_y3": 432.6, "coord_origin": "TOPLEFT"}, "text": "42", "orig": "42", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 139, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 398.523, "r_y0": 438.178, "r_x1": 404.843, "r_y1": 438.178, "r_x2": 404.843, "r_y2": 432.6, "r_x3": 398.523, "r_y3": 432.6, "coord_origin": "TOPLEFT"}, "text": "43", "orig": "43", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 140, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 411.476, "r_y0": 438.178, "r_x1": 417.795, "r_y1": 438.178, "r_x2": 417.795, "r_y2": 432.6, "r_x3": 411.476, "r_y3": 432.6, "coord_origin": "TOPLEFT"}, "text": "44", "orig": "44", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 141, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 424.429, "r_y0": 438.178, "r_x1": 430.748, "r_y1": 438.178, "r_x2": 430.748, "r_y2": 432.6, "r_x3": 424.429, "r_y3": 432.6, "coord_origin": "TOPLEFT"}, "text": "45", "orig": "45", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 142, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 437.381, "r_y0": 438.178, "r_x1": 443.701, "r_y1": 438.178, "r_x2": 443.701, "r_y2": 432.6, "r_x3": 437.381, "r_y3": 432.6, "coord_origin": "TOPLEFT"}, "text": "46", "orig": "46", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 143, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 450.334, "r_y0": 438.178, "r_x1": 456.653, "r_y1": 438.178, "r_x2": 456.653, "r_y2": 432.6, "r_x3": 450.334, "r_y3": 432.6, "coord_origin": "TOPLEFT"}, "text": "47", "orig": "47", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 144, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 463.287, "r_y0": 438.178, "r_x1": 469.606, "r_y1": 438.178, "r_x2": 469.606, "r_y2": 432.6, "r_x3": 463.287, "r_y3": 432.6, "coord_origin": "TOPLEFT"}, "text": "48", "orig": "48", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 145, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 476.239, "r_y0": 438.178, "r_x1": 482.558, "r_y1": 438.178, "r_x2": 482.558, "r_y2": 432.6, "r_x3": 476.239, "r_y3": 432.6, "coord_origin": "TOPLEFT"}, "text": "49", "orig": "49", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 146, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 489.192, "r_y0": 438.178, "r_x1": 495.511, "r_y1": 438.178, "r_x2": 495.511, "r_y2": 432.6, "r_x3": 489.192, "r_y3": 432.6, "coord_origin": "TOPLEFT"}, "text": "50", "orig": "50", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 147, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 502.144, "r_y0": 438.178, "r_x1": 508.464, "r_y1": 438.178, "r_x2": 508.464, "r_y2": 432.6, "r_x3": 502.144, "r_y3": 432.6, "coord_origin": "TOPLEFT"}, "text": "51", "orig": "51", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 148, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 515.097, "r_y0": 438.178, "r_x1": 521.416, "r_y1": 438.178, "r_x2": 521.416, "r_y2": 432.6, "r_x3": 515.097, "r_y3": 432.6, "coord_origin": "TOPLEFT"}, "text": "52", "orig": "52", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 149, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 528.05, "r_y0": 438.178, "r_x1": 534.369, "r_y1": 438.178, "r_x2": 534.369, "r_y2": 432.6, "r_x3": 528.05, "r_y3": 432.6, "coord_origin": "TOPLEFT"}, "text": "53", "orig": "53", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 150, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 385.281, "r_y0": 395.333, "r_x1": 388.441, "r_y1": 395.333, "r_x2": 388.441, "r_y2": 389.756, "r_x3": 385.281, "r_y3": 389.756, "coord_origin": "TOPLEFT"}, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 151, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 398.523, "r_y0": 395.333, "r_x1": 401.683, "r_y1": 395.333, "r_x2": 401.683, "r_y2": 389.756, "r_x3": 398.523, "r_y3": 389.756, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 152, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 411.475, "r_y0": 395.333, "r_x1": 414.635, "r_y1": 395.333, "r_x2": 414.635, "r_y2": 389.756, "r_x3": 411.475, "r_y3": 389.756, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 153, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 424.427, "r_y0": 395.333, "r_x1": 427.587, "r_y1": 395.333, "r_x2": 427.587, "r_y2": 389.756, "r_x3": 424.427, "r_y3": 389.756, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 154, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 437.379, "r_y0": 395.333, "r_x1": 440.539, "r_y1": 395.333, "r_x2": 440.539, "r_y2": 389.756, "r_x3": 437.379, "r_y3": 389.756, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 155, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 450.331, "r_y0": 395.333, "r_x1": 453.491, "r_y1": 395.333, "r_x2": 453.491, "r_y2": 389.756, "r_x3": 450.331, "r_y3": 389.756, "coord_origin": "TOPLEFT"}, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 156, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 463.283, "r_y0": 395.333, "r_x1": 466.443, "r_y1": 395.333, "r_x2": 466.443, "r_y2": 389.756, "r_x3": 463.283, "r_y3": 389.756, "coord_origin": "TOPLEFT"}, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 157, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 476.235, "r_y0": 395.333, "r_x1": 479.395, "r_y1": 395.333, "r_x2": 479.395, "r_y2": 389.756, "r_x3": 476.235, "r_y3": 389.756, "coord_origin": "TOPLEFT"}, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 158, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 489.187, "r_y0": 395.333, "r_x1": 492.347, "r_y1": 395.333, "r_x2": 492.347, "r_y2": 389.756, "r_x3": 489.187, "r_y3": 389.756, "coord_origin": "TOPLEFT"}, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 159, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 502.139, "r_y0": 395.333, "r_x1": 505.299, "r_y1": 395.333, "r_x2": 505.299, "r_y2": 389.756, "r_x3": 502.139, "r_y3": 389.756, "coord_origin": "TOPLEFT"}, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 160, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 515.091, "r_y0": 395.333, "r_x1": 521.411, "r_y1": 395.333, "r_x2": 521.411, "r_y2": 389.756, "r_x3": 515.091, "r_y3": 389.756, "coord_origin": "TOPLEFT"}, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 161, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 528.044, "r_y0": 395.333, "r_x1": 534.131, "r_y1": 395.333, "r_x2": 534.131, "r_y2": 389.756, "r_x3": 528.044, "r_y3": 389.756, "coord_origin": "TOPLEFT"}, "text": "11", "orig": "11", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 162, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 385.281, "r_y0": 405.108, "r_x1": 391.601, "r_y1": 405.108, "r_x2": 391.601, "r_y2": 399.531, "r_x3": 385.281, "r_y3": 399.531, "coord_origin": "TOPLEFT"}, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 163, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 398.523, "r_y0": 405.108, "r_x1": 404.843, "r_y1": 405.108, "r_x2": 404.843, "r_y2": 399.531, "r_x3": 398.523, "r_y3": 399.531, "coord_origin": "TOPLEFT"}, "text": "13", "orig": "13", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 164, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 411.476, "r_y0": 405.108, "r_x1": 417.795, "r_y1": 405.108, "r_x2": 417.795, "r_y2": 399.531, "r_x3": 411.476, "r_y3": 399.531, "coord_origin": "TOPLEFT"}, "text": "14", "orig": "14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 165, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 424.427, "r_y0": 412.908, "r_x1": 430.746, "r_y1": 412.908, "r_x2": 430.746, "r_y2": 407.331, "r_x3": 424.427, "r_y3": 407.331, "coord_origin": "TOPLEFT"}, "text": "15", "orig": "15", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 166, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 502.869, "r_y0": 417.128, "r_x1": 509.189, "r_y1": 417.128, "r_x2": 509.189, "r_y2": 411.55, "r_x3": 502.869, "r_y3": 411.55, "coord_origin": "TOPLEFT"}, "text": "29", "orig": "29", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 167, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 384.354, "r_y0": 386.393, "r_x1": 430.993, "r_y1": 386.393, "r_x2": 430.993, "r_y2": 381.96, "r_x3": 384.354, "r_y3": 381.96, "coord_origin": "TOPLEFT"}, "text": "Predicted Structure", "orig": "Predicted Structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": [{"id": 158, "label": "text", "bbox": {"l": 437.379, "t": 401.109, "r": 443.699, "b": 406.686, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 113, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 437.379, "r_y0": 406.686, "r_x1": 443.699, "r_y1": 406.686, "r_x2": 443.699, "r_y2": 401.109, "r_x3": 437.379, "r_y3": 401.109, "coord_origin": "TOPLEFT"}, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 159, "label": "text", "bbox": {"l": 450.332, "t": 401.109, "r": 456.651, "b": 406.686, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 114, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 450.332, "r_y0": 406.686, "r_x1": 456.651, "r_y1": 406.686, "r_x2": 456.651, "r_y2": 401.109, "r_x3": 450.332, "r_y3": 401.109, "coord_origin": "TOPLEFT"}, "text": "17", "orig": "17", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 160, "label": "text", "bbox": {"l": 463.285, "t": 401.109, "r": 469.604, "b": 406.686, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 115, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 463.285, "r_y0": 406.686, "r_x1": 469.604, "r_y1": 406.686, "r_x2": 469.604, "r_y2": 401.109, "r_x3": 463.285, "r_y3": 401.109, "coord_origin": "TOPLEFT"}, "text": "18", "orig": "18", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 161, "label": "text", "bbox": {"l": 476.237, "t": 401.109, "r": 482.557, "b": 406.686, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 116, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 476.237, "r_y0": 406.686, "r_x1": 482.557, "r_y1": 406.686, "r_x2": 482.557, "r_y2": 401.109, "r_x3": 476.237, "r_y3": 401.109, "coord_origin": "TOPLEFT"}, "text": "19", "orig": "19", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 162, "label": "text", "bbox": {"l": 489.19, "t": 401.109, "r": 495.509, "b": 406.686, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 117, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 489.19, "r_y0": 406.686, "r_x1": 495.509, "r_y1": 406.686, "r_x2": 495.509, "r_y2": 401.109, "r_x3": 489.19, "r_y3": 401.109, "coord_origin": "TOPLEFT"}, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 163, "label": "text", "bbox": {"l": 502.143, "t": 401.109, "r": 508.462, "b": 406.686, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 118, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 502.143, "r_y0": 406.686, "r_x1": 508.462, "r_y1": 406.686, "r_x2": 508.462, "r_y2": 401.109, "r_x3": 502.143, "r_y3": 401.109, "coord_origin": "TOPLEFT"}, "text": "21", "orig": "21", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 164, "label": "text", "bbox": {"l": 515.095, "t": 401.109, "r": 521.414, "b": 406.686, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 119, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 515.095, "r_y0": 406.686, "r_x1": 521.414, "r_y1": 406.686, "r_x2": 521.414, "r_y2": 401.109, "r_x3": 515.095, "r_y3": 401.109, "coord_origin": "TOPLEFT"}, "text": "22", "orig": "22", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 165, "label": "text", "bbox": {"l": 385.281, "t": 411.594, "r": 391.601, "b": 417.172, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 120, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 385.281, "r_y0": 417.172, "r_x1": 391.601, "r_y1": 417.172, "r_x2": 391.601, "r_y2": 411.594, "r_x3": 385.281, "r_y3": 411.594, "coord_origin": "TOPLEFT"}, "text": "23", "orig": "23", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 166, "label": "text", "bbox": {"l": 398.523, "t": 411.594, "r": 404.843, "b": 417.172, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 121, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 398.523, "r_y0": 417.172, "r_x1": 404.843, "r_y1": 417.172, "r_x2": 404.843, "r_y2": 411.594, "r_x3": 398.523, "r_y3": 411.594, "coord_origin": "TOPLEFT"}, "text": "24", "orig": "24", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 167, "label": "text", "bbox": {"l": 411.476, "t": 411.594, "r": 417.795, "b": 417.172, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 122, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 411.476, "r_y0": 417.172, "r_x1": 417.795, "r_y1": 417.172, "r_x2": 417.795, "r_y2": 411.594, "r_x3": 411.476, "r_y3": 411.594, "coord_origin": "TOPLEFT"}, "text": "25", "orig": "25", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 168, "label": "text", "bbox": {"l": 437.379, "t": 411.594, "r": 443.699, "b": 417.172, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 123, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 437.379, "r_y0": 417.172, "r_x1": 443.699, "r_y1": 417.172, "r_x2": 443.699, "r_y2": 411.594, "r_x3": 437.379, "r_y3": 411.594, "coord_origin": "TOPLEFT"}, "text": "26", "orig": "26", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 169, "label": "text", "bbox": {"l": 450.332, "t": 411.594, "r": 456.651, "b": 417.172, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 124, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 450.332, "r_y0": 417.172, "r_x1": 456.651, "r_y1": 417.172, "r_x2": 456.651, "r_y2": 411.594, "r_x3": 450.332, "r_y3": 411.594, "coord_origin": "TOPLEFT"}, "text": "27", "orig": "27", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 170, "label": "text", "bbox": {"l": 463.285, "t": 411.594, "r": 469.604, "b": 417.172, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 125, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 463.285, "r_y0": 417.172, "r_x1": 469.604, "r_y1": 417.172, "r_x2": 469.604, "r_y2": 411.594, "r_x3": 463.285, "r_y3": 411.594, "coord_origin": "TOPLEFT"}, "text": "28", "orig": "28", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 171, "label": "text", "bbox": {"l": 385.281, "t": 421.626, "r": 391.601, "b": 427.203, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 126, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 385.281, "r_y0": 427.203, "r_x1": 391.601, "r_y1": 427.203, "r_x2": 391.601, "r_y2": 421.626, "r_x3": 385.281, "r_y3": 421.626, "coord_origin": "TOPLEFT"}, "text": "30", "orig": "30", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 172, "label": "text", "bbox": {"l": 398.523, "t": 421.626, "r": 404.843, "b": 427.203, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 127, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 398.523, "r_y0": 427.203, "r_x1": 404.843, "r_y1": 427.203, "r_x2": 404.843, "r_y2": 421.626, "r_x3": 398.523, "r_y3": 421.626, "coord_origin": "TOPLEFT"}, "text": "31", "orig": "31", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 173, "label": "text", "bbox": {"l": 411.476, "t": 421.626, "r": 417.795, "b": 427.203, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 128, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 411.476, "r_y0": 427.203, "r_x1": 417.795, "r_y1": 427.203, "r_x2": 417.795, "r_y2": 421.626, "r_x3": 411.476, "r_y3": 421.626, "coord_origin": "TOPLEFT"}, "text": "32", "orig": "32", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 174, "label": "text", "bbox": {"l": 424.429, "t": 421.626, "r": 430.748, "b": 427.203, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 129, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 424.429, "r_y0": 427.203, "r_x1": 430.748, "r_y1": 427.203, "r_x2": 430.748, "r_y2": 421.626, "r_x3": 424.429, "r_y3": 421.626, "coord_origin": "TOPLEFT"}, "text": "33", "orig": "33", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 175, "label": "text", "bbox": {"l": 437.381, "t": 421.626, "r": 443.701, "b": 427.203, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 130, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 437.381, "r_y0": 427.203, "r_x1": 443.701, "r_y1": 427.203, "r_x2": 443.701, "r_y2": 421.626, "r_x3": 437.381, "r_y3": 421.626, "coord_origin": "TOPLEFT"}, "text": "34", "orig": "34", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 176, "label": "text", "bbox": {"l": 450.334, "t": 421.626, "r": 456.653, "b": 427.203, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 131, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 450.334, "r_y0": 427.203, "r_x1": 456.653, "r_y1": 427.203, "r_x2": 456.653, "r_y2": 421.626, "r_x3": 450.334, "r_y3": 421.626, "coord_origin": "TOPLEFT"}, "text": "35", "orig": "35", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 177, "label": "text", "bbox": {"l": 463.287, "t": 421.626, "r": 469.606, "b": 427.203, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 132, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 463.287, "r_y0": 427.203, "r_x1": 469.606, "r_y1": 427.203, "r_x2": 469.606, "r_y2": 421.626, "r_x3": 463.287, "r_y3": 421.626, "coord_origin": "TOPLEFT"}, "text": "36", "orig": "36", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 178, "label": "text", "bbox": {"l": 476.239, "t": 421.626, "r": 482.558, "b": 427.203, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 133, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 476.239, "r_y0": 427.203, "r_x1": 482.558, "r_y1": 427.203, "r_x2": 482.558, "r_y2": 421.626, "r_x3": 476.239, "r_y3": 421.626, "coord_origin": "TOPLEFT"}, "text": "37", "orig": "37", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 179, "label": "text", "bbox": {"l": 489.192, "t": 421.626, "r": 495.511, "b": 427.203, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 134, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 489.192, "r_y0": 427.203, "r_x1": 495.511, "r_y1": 427.203, "r_x2": 495.511, "r_y2": 421.626, "r_x3": 489.192, "r_y3": 421.626, "coord_origin": "TOPLEFT"}, "text": "38", "orig": "38", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 180, "label": "text", "bbox": {"l": 502.144, "t": 421.626, "r": 508.464, "b": 427.203, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 135, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 502.144, "r_y0": 427.203, "r_x1": 508.464, "r_y1": 427.203, "r_x2": 508.464, "r_y2": 421.626, "r_x3": 502.144, "r_y3": 421.626, "coord_origin": "TOPLEFT"}, "text": "39", "orig": "39", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 181, "label": "text", "bbox": {"l": 515.097, "t": 421.626, "r": 521.416, "b": 427.203, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 136, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 515.097, "r_y0": 427.203, "r_x1": 521.416, "r_y1": 427.203, "r_x2": 521.416, "r_y2": 421.626, "r_x3": 515.097, "r_y3": 421.626, "coord_origin": "TOPLEFT"}, "text": "40", "orig": "40", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 182, "label": "text", "bbox": {"l": 528.05, "t": 421.626, "r": 534.369, "b": 427.203, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 137, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 528.05, "r_y0": 427.203, "r_x1": 534.369, "r_y1": 427.203, "r_x2": 534.369, "r_y2": 421.626, "r_x3": 528.05, "r_y3": 421.626, "coord_origin": "TOPLEFT"}, "text": "41", "orig": "41", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 183, "label": "text", "bbox": {"l": 385.281, "t": 432.6, "r": 391.601, "b": 438.178, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 138, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 385.281, "r_y0": 438.178, "r_x1": 391.601, "r_y1": 438.178, "r_x2": 391.601, "r_y2": 432.6, "r_x3": 385.281, "r_y3": 432.6, "coord_origin": "TOPLEFT"}, "text": "42", "orig": "42", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 184, "label": "text", "bbox": {"l": 398.523, "t": 432.6, "r": 404.843, "b": 438.178, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 139, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 398.523, "r_y0": 438.178, "r_x1": 404.843, "r_y1": 438.178, "r_x2": 404.843, "r_y2": 432.6, "r_x3": 398.523, "r_y3": 432.6, "coord_origin": "TOPLEFT"}, "text": "43", "orig": "43", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 185, "label": "text", "bbox": {"l": 411.476, "t": 432.6, "r": 417.795, "b": 438.178, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 140, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 411.476, "r_y0": 438.178, "r_x1": 417.795, "r_y1": 438.178, "r_x2": 417.795, "r_y2": 432.6, "r_x3": 411.476, "r_y3": 432.6, "coord_origin": "TOPLEFT"}, "text": "44", "orig": "44", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 186, "label": "text", "bbox": {"l": 424.429, "t": 432.6, "r": 430.748, "b": 438.178, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 141, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 424.429, "r_y0": 438.178, "r_x1": 430.748, "r_y1": 438.178, "r_x2": 430.748, "r_y2": 432.6, "r_x3": 424.429, "r_y3": 432.6, "coord_origin": "TOPLEFT"}, "text": "45", "orig": "45", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 187, "label": "text", "bbox": {"l": 437.381, "t": 432.6, "r": 443.701, "b": 438.178, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 142, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 437.381, "r_y0": 438.178, "r_x1": 443.701, "r_y1": 438.178, "r_x2": 443.701, "r_y2": 432.6, "r_x3": 437.381, "r_y3": 432.6, "coord_origin": "TOPLEFT"}, "text": "46", "orig": "46", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 188, "label": "text", "bbox": {"l": 450.334, "t": 432.6, "r": 456.653, "b": 438.178, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 143, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 450.334, "r_y0": 438.178, "r_x1": 456.653, "r_y1": 438.178, "r_x2": 456.653, "r_y2": 432.6, "r_x3": 450.334, "r_y3": 432.6, "coord_origin": "TOPLEFT"}, "text": "47", "orig": "47", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 189, "label": "text", "bbox": {"l": 463.287, "t": 432.6, "r": 469.606, "b": 438.178, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 144, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 463.287, "r_y0": 438.178, "r_x1": 469.606, "r_y1": 438.178, "r_x2": 469.606, "r_y2": 432.6, "r_x3": 463.287, "r_y3": 432.6, "coord_origin": "TOPLEFT"}, "text": "48", "orig": "48", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 190, "label": "text", "bbox": {"l": 476.239, "t": 432.6, "r": 482.558, "b": 438.178, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 145, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 476.239, "r_y0": 438.178, "r_x1": 482.558, "r_y1": 438.178, "r_x2": 482.558, "r_y2": 432.6, "r_x3": 476.239, "r_y3": 432.6, "coord_origin": "TOPLEFT"}, "text": "49", "orig": "49", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 191, "label": "text", "bbox": {"l": 489.192, "t": 432.6, "r": 495.511, "b": 438.178, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 146, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 489.192, "r_y0": 438.178, "r_x1": 495.511, "r_y1": 438.178, "r_x2": 495.511, "r_y2": 432.6, "r_x3": 489.192, "r_y3": 432.6, "coord_origin": "TOPLEFT"}, "text": "50", "orig": "50", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 192, "label": "text", "bbox": {"l": 502.144, "t": 432.6, "r": 508.464, "b": 438.178, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 147, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 502.144, "r_y0": 438.178, "r_x1": 508.464, "r_y1": 438.178, "r_x2": 508.464, "r_y2": 432.6, "r_x3": 502.144, "r_y3": 432.6, "coord_origin": "TOPLEFT"}, "text": "51", "orig": "51", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 193, "label": "text", "bbox": {"l": 515.097, "t": 432.6, "r": 521.416, "b": 438.178, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 148, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 515.097, "r_y0": 438.178, "r_x1": 521.416, "r_y1": 438.178, "r_x2": 521.416, "r_y2": 432.6, "r_x3": 515.097, "r_y3": 432.6, "coord_origin": "TOPLEFT"}, "text": "52", "orig": "52", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 194, "label": "text", "bbox": {"l": 528.05, "t": 432.6, "r": 534.369, "b": 438.178, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 149, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 528.05, "r_y0": 438.178, "r_x1": 534.369, "r_y1": 438.178, "r_x2": 534.369, "r_y2": 432.6, "r_x3": 528.05, "r_y3": 432.6, "coord_origin": "TOPLEFT"}, "text": "53", "orig": "53", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 195, "label": "text", "bbox": {"l": 385.281, "t": 389.756, "r": 388.441, "b": 395.333, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 150, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 385.281, "r_y0": 395.333, "r_x1": 388.441, "r_y1": 395.333, "r_x2": 388.441, "r_y2": 389.756, "r_x3": 385.281, "r_y3": 389.756, "coord_origin": "TOPLEFT"}, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 196, "label": "text", "bbox": {"l": 398.523, "t": 389.756, "r": 401.683, "b": 395.333, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 151, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 398.523, "r_y0": 395.333, "r_x1": 401.683, "r_y1": 395.333, "r_x2": 401.683, "r_y2": 389.756, "r_x3": 398.523, "r_y3": 389.756, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 197, "label": "text", "bbox": {"l": 411.475, "t": 389.756, "r": 414.635, "b": 395.333, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 152, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 411.475, "r_y0": 395.333, "r_x1": 414.635, "r_y1": 395.333, "r_x2": 414.635, "r_y2": 389.756, "r_x3": 411.475, "r_y3": 389.756, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 198, "label": "text", "bbox": {"l": 424.427, "t": 389.756, "r": 427.587, "b": 395.333, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 153, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 424.427, "r_y0": 395.333, "r_x1": 427.587, "r_y1": 395.333, "r_x2": 427.587, "r_y2": 389.756, "r_x3": 424.427, "r_y3": 389.756, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 199, "label": "text", "bbox": {"l": 437.379, "t": 389.756, "r": 440.539, "b": 395.333, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 154, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 437.379, "r_y0": 395.333, "r_x1": 440.539, "r_y1": 395.333, "r_x2": 440.539, "r_y2": 389.756, "r_x3": 437.379, "r_y3": 389.756, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 200, "label": "text", "bbox": {"l": 450.331, "t": 389.756, "r": 453.491, "b": 395.333, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 155, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 450.331, "r_y0": 395.333, "r_x1": 453.491, "r_y1": 395.333, "r_x2": 453.491, "r_y2": 389.756, "r_x3": 450.331, "r_y3": 389.756, "coord_origin": "TOPLEFT"}, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 201, "label": "text", "bbox": {"l": 463.283, "t": 389.756, "r": 466.443, "b": 395.333, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 156, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 463.283, "r_y0": 395.333, "r_x1": 466.443, "r_y1": 395.333, "r_x2": 466.443, "r_y2": 389.756, "r_x3": 463.283, "r_y3": 389.756, "coord_origin": "TOPLEFT"}, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 202, "label": "text", "bbox": {"l": 476.235, "t": 389.756, "r": 479.395, "b": 395.333, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 157, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 476.235, "r_y0": 395.333, "r_x1": 479.395, "r_y1": 395.333, "r_x2": 479.395, "r_y2": 389.756, "r_x3": 476.235, "r_y3": 389.756, "coord_origin": "TOPLEFT"}, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 203, "label": "text", "bbox": {"l": 489.187, "t": 389.756, "r": 492.347, "b": 395.333, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 158, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 489.187, "r_y0": 395.333, "r_x1": 492.347, "r_y1": 395.333, "r_x2": 492.347, "r_y2": 389.756, "r_x3": 489.187, "r_y3": 389.756, "coord_origin": "TOPLEFT"}, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 204, "label": "text", "bbox": {"l": 502.139, "t": 389.756, "r": 505.299, "b": 395.333, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 159, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 502.139, "r_y0": 395.333, "r_x1": 505.299, "r_y1": 395.333, "r_x2": 505.299, "r_y2": 389.756, "r_x3": 502.139, "r_y3": 389.756, "coord_origin": "TOPLEFT"}, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 205, "label": "text", "bbox": {"l": 515.091, "t": 389.756, "r": 521.411, "b": 395.333, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 160, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 515.091, "r_y0": 395.333, "r_x1": 521.411, "r_y1": 395.333, "r_x2": 521.411, "r_y2": 389.756, "r_x3": 515.091, "r_y3": 389.756, "coord_origin": "TOPLEFT"}, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 206, "label": "text", "bbox": {"l": 528.044, "t": 389.756, "r": 534.131, "b": 395.333, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 161, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 528.044, "r_y0": 395.333, "r_x1": 534.131, "r_y1": 395.333, "r_x2": 534.131, "r_y2": 389.756, "r_x3": 528.044, "r_y3": 389.756, "coord_origin": "TOPLEFT"}, "text": "11", "orig": "11", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 207, "label": "text", "bbox": {"l": 385.281, "t": 399.531, "r": 391.601, "b": 405.108, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 162, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 385.281, "r_y0": 405.108, "r_x1": 391.601, "r_y1": 405.108, "r_x2": 391.601, "r_y2": 399.531, "r_x3": 385.281, "r_y3": 399.531, "coord_origin": "TOPLEFT"}, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 208, "label": "text", "bbox": {"l": 398.523, "t": 399.531, "r": 404.843, "b": 405.108, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 163, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 398.523, "r_y0": 405.108, "r_x1": 404.843, "r_y1": 405.108, "r_x2": 404.843, "r_y2": 399.531, "r_x3": 398.523, "r_y3": 399.531, "coord_origin": "TOPLEFT"}, "text": "13", "orig": "13", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 209, "label": "text", "bbox": {"l": 411.476, "t": 399.531, "r": 417.795, "b": 405.108, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 164, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 411.476, "r_y0": 405.108, "r_x1": 417.795, "r_y1": 405.108, "r_x2": 417.795, "r_y2": 399.531, "r_x3": 411.476, "r_y3": 399.531, "coord_origin": "TOPLEFT"}, "text": "14", "orig": "14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 210, "label": "text", "bbox": {"l": 424.427, "t": 407.331, "r": 430.746, "b": 412.908, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 165, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 424.427, "r_y0": 412.908, "r_x1": 430.746, "r_y1": 412.908, "r_x2": 430.746, "r_y2": 407.331, "r_x3": 424.427, "r_y3": 407.331, "coord_origin": "TOPLEFT"}, "text": "15", "orig": "15", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 211, "label": "text", "bbox": {"l": 502.869, "t": 411.55, "r": 509.189, "b": 417.128, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 166, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 502.869, "r_y0": 417.128, "r_x1": 509.189, "r_y1": 417.128, "r_x2": 509.189, "r_y2": 411.55, "r_x3": 502.869, "r_y3": 411.55, "coord_origin": "TOPLEFT"}, "text": "29", "orig": "29", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 212, "label": "text", "bbox": {"l": 384.354, "t": 381.96, "r": 430.993, "b": 386.393, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 167, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 384.354, "r_y0": 386.393, "r_x1": 430.993, "r_y1": 386.393, "r_x2": 430.993, "r_y2": 381.96, "r_x3": 384.354, "r_y3": 381.96, "coord_origin": "TOPLEFT"}, "text": "Predicted Structure", "orig": "Predicted Structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}]}, {"id": 5, "label": "caption", "bbox": {"l": 62.595, "t": 458.997, "r": 532.63, "b": 467.549, "coord_origin": "TOPLEFT"}, "confidence": 0.9153602719306946, "cells": [{"index": 168, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.595, "r_y0": 467.549, "r_x1": 98.849, "r_y1": 467.549, "r_x2": 98.849, "r_y2": 458.997, "r_x3": 62.595, "r_y3": 458.997, "coord_origin": "TOPLEFT"}, "text": "Figure 6:", "orig": "Figure 6:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 169, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 104.428, "r_y0": 467.549, "r_x1": 532.63, "r_y1": 467.549, "r_x2": 532.63, "r_y2": 458.997, "r_x3": 104.428, "r_y3": 458.997, "coord_origin": "TOPLEFT"}, "text": "An example of TableFormer predictions (bounding boxes and structure) from generated SynthTabNet table.", "orig": "An example of TableFormer predictions (bounding boxes and structure) from generated SynthTabNet table.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 2, "label": "section_header", "bbox": {"l": 50.112, "t": 491.395, "r": 163.756, "b": 501.247, "coord_origin": "TOPLEFT"}, "confidence": 0.9561247229576111, "cells": [{"index": 170, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 501.247, "r_x1": 163.756, "r_y1": 501.247, "r_x2": 163.756, "r_y2": 491.395, "r_x3": 50.112, "r_y3": 491.395, "coord_origin": "TOPLEFT"}, "text": "5.5. Qualitative Analysis", "orig": "5.5. Qualitative Analysis", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 1, "label": "text", "bbox": {"l": 50.112, "t": 537.142, "r": 286.365, "b": 713.066, "coord_origin": "TOPLEFT"}, "confidence": 0.9852361679077148, "cells": [{"index": 171, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 545.694, "r_x1": 118.505, "r_y1": 545.694, "r_x2": 118.505, "r_y2": 537.142, "r_x3": 62.067, "r_y3": 537.142, "coord_origin": "TOPLEFT"}, "text": "We showcase", "orig": "We showcase", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 172, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 123.985, "r_y0": 545.694, "r_x1": 151.8, "r_y1": 545.694, "r_x2": 151.8, "r_y2": 537.142, "r_x3": 123.985, "r_y3": 537.142, "coord_origin": "TOPLEFT"}, "text": "several", "orig": "several", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 173, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 157.28, "r_y0": 545.694, "r_x1": 212.074, "r_y1": 545.694, "r_x2": 212.074, "r_y2": 537.142, "r_x3": 157.28, "r_y3": 537.142, "coord_origin": "TOPLEFT"}, "text": "visualizations", "orig": "visualizations", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 174, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 217.553, "r_y0": 545.694, "r_x1": 229.17, "r_y1": 545.694, "r_x2": 229.17, "r_y2": 537.142, "r_x3": 217.553, "r_y3": 537.142, "coord_origin": "TOPLEFT"}, "text": "for", "orig": "for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 175, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 234.659, "r_y0": 545.694, "r_x1": 246.833, "r_y1": 545.694, "r_x2": 246.833, "r_y2": 537.142, "r_x3": 234.659, "r_y3": 537.142, "coord_origin": "TOPLEFT"}, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 176, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 252.313, "r_y0": 545.694, "r_x1": 286.365, "r_y1": 545.694, "r_x2": 286.365, "r_y2": 537.142, "r_x3": 252.313, "r_y3": 537.142, "coord_origin": "TOPLEFT"}, "text": "different", "orig": "different", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 177, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 557.649, "r_x1": 211.157, "r_y1": 557.649, "r_x2": 211.157, "r_y2": 549.097, "r_x3": 50.112, "r_y3": 549.097, "coord_origin": "TOPLEFT"}, "text": "components of our network on various", "orig": "components of our network on various", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 178, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 215.1, "r_y0": 557.506, "r_x1": 259.175, "r_y1": 557.506, "r_x2": 259.175, "r_y2": 548.918, "r_x3": 215.1, "r_y3": 548.918, "coord_origin": "TOPLEFT"}, "text": "'complex'", "orig": "'complex'", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 179, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 263.12, "r_y0": 557.649, "r_x1": 286.363, "r_y1": 557.649, "r_x2": 286.363, "r_y2": 549.097, "r_x3": 263.12, "r_y3": 549.097, "coord_origin": "TOPLEFT"}, "text": "tables", "orig": "tables", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 180, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 569.604, "r_x1": 231.72, "r_y1": 569.604, "r_x2": 231.72, "r_y2": 561.052, "r_x3": 50.112, "r_y3": 561.052, "coord_origin": "TOPLEFT"}, "text": "within datasets presented in this work in Fig.", "orig": "within datasets presented in this work in Fig.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 181, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 236.064, "r_y0": 569.604, "r_x1": 277.03, "r_y1": 569.604, "r_x2": 277.03, "r_y2": 561.052, "r_x3": 236.064, "r_y3": 561.052, "coord_origin": "TOPLEFT"}, "text": "5 and Fig.", "orig": "5 and Fig.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 182, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 281.384, "r_y0": 569.604, "r_x1": 286.365, "r_y1": 569.604, "r_x2": 286.365, "r_y2": 561.052, "r_x3": 281.384, "r_y3": 561.052, "coord_origin": "TOPLEFT"}, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 183, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 581.559, "r_x1": 286.365, "r_y1": 581.559, "r_x2": 286.365, "r_y2": 573.0070000000001, "r_x3": 50.112, "r_y3": 573.0070000000001, "coord_origin": "TOPLEFT"}, "text": "As it is shown, our model is able to predict bounding boxes", "orig": "As it is shown, our model is able to predict bounding boxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 184, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 593.514, "r_x1": 122.341, "r_y1": 593.514, "r_x2": 122.341, "r_y2": 584.962, "r_x3": 50.112, "r_y3": 584.962, "coord_origin": "TOPLEFT"}, "text": "for all table cells,", "orig": "for all table cells,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 185, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 126.107, "r_y0": 593.514, "r_x1": 228.004, "r_y1": 593.514, "r_x2": 228.004, "r_y2": 584.962, "r_x3": 126.107, "r_y3": 584.962, "coord_origin": "TOPLEFT"}, "text": "even for the empty ones.", "orig": "even for the empty ones.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 186, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 234.151, "r_y0": 593.514, "r_x1": 286.365, "r_y1": 593.514, "r_x2": 286.365, "r_y2": 584.962, "r_x3": 234.151, "r_y3": 584.962, "coord_origin": "TOPLEFT"}, "text": "Additionally,", "orig": "Additionally,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 187, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 605.47, "r_x1": 286.365, "r_y1": 605.47, "r_x2": 286.365, "r_y2": 596.918, "r_x3": 50.112, "r_y3": 596.918, "coord_origin": "TOPLEFT"}, "text": "our post-processing techniques can extract the cell content", "orig": "our post-processing techniques can extract the cell content", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 188, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 617.425, "r_x1": 286.365, "r_y1": 617.425, "r_x2": 286.365, "r_y2": 608.873, "r_x3": 50.112, "r_y3": 608.873, "coord_origin": "TOPLEFT"}, "text": "by matching the predicted bounding boxes to the PDF cells", "orig": "by matching the predicted bounding boxes to the PDF cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 189, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 629.38, "r_x1": 230.873, "r_y1": 629.38, "r_x2": 230.873, "r_y2": 620.828, "r_x3": 50.112, "r_y3": 620.828, "coord_origin": "TOPLEFT"}, "text": "based on their overlap and spatial proximity.", "orig": "based on their overlap and spatial proximity.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 190, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 235.855, "r_y0": 629.38, "r_x1": 286.365, "r_y1": 629.38, "r_x2": 286.365, "r_y2": 620.828, "r_x3": 235.855, "r_y3": 620.828, "coord_origin": "TOPLEFT"}, "text": "The left part", "orig": "The left part", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 191, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 641.335, "r_x1": 77.121, "r_y1": 641.335, "r_x2": 77.121, "r_y2": 632.783, "r_x3": 50.112, "r_y3": 632.783, "coord_origin": "TOPLEFT"}, "text": "of Fig.", "orig": "of Fig.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 192, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 81.544, "r_y0": 641.335, "r_x1": 286.365, "r_y1": 641.335, "r_x2": 286.365, "r_y2": 632.783, "r_x3": 81.544, "r_y3": 632.783, "coord_origin": "TOPLEFT"}, "text": "5 demonstrates also the adaptability of our method", "orig": "5 demonstrates also the adaptability of our method", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 193, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 653.29, "r_x1": 57.863, "r_y1": 653.29, "r_x2": 57.863, "r_y2": 644.738, "r_x3": 50.112, "r_y3": 644.738, "coord_origin": "TOPLEFT"}, "text": "to", "orig": "to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 194, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.436, "r_y0": 653.29, "r_x1": 119.691, "r_y1": 653.29, "r_x2": 119.691, "r_y2": 644.738, "r_x3": 62.436, "r_y3": 644.738, "coord_origin": "TOPLEFT"}, "text": "any language,", "orig": "any language,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 195, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 124.782, "r_y0": 653.29, "r_x1": 133.081, "r_y1": 653.29, "r_x2": 133.081, "r_y2": 644.738, "r_x3": 124.782, "r_y3": 644.738, "coord_origin": "TOPLEFT"}, "text": "as", "orig": "as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 196, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 137.653, "r_y0": 653.29, "r_x1": 143.193, "r_y1": 653.29, "r_x2": 143.193, "r_y2": 644.738, "r_x3": 137.653, "r_y3": 644.738, "coord_origin": "TOPLEFT"}, "text": "it", "orig": "it", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 197, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 147.765, "r_y0": 653.29, "r_x1": 214.854, "r_y1": 653.29, "r_x2": 214.854, "r_y2": 644.738, "r_x3": 147.765, "r_y3": 644.738, "coord_origin": "TOPLEFT"}, "text": "can successfully", "orig": "can successfully", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 198, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 219.426, "r_y0": 653.29, "r_x1": 246.385, "r_y1": 653.29, "r_x2": 246.385, "r_y2": 644.738, "r_x3": 219.426, "r_y3": 644.738, "coord_origin": "TOPLEFT"}, "text": "extract", "orig": "extract", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 199, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 250.958, "r_y0": 653.29, "r_x1": 286.365, "r_y1": 653.29, "r_x2": 286.365, "r_y2": 644.738, "r_x3": 250.958, "r_y3": 644.738, "coord_origin": "TOPLEFT"}, "text": "Japanese", "orig": "Japanese", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 200, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 665.245, "r_x1": 286.365, "r_y1": 665.245, "r_x2": 286.365, "r_y2": 656.693, "r_x3": 50.112, "r_y3": 656.693, "coord_origin": "TOPLEFT"}, "text": "text, although the training set contains only English content.", "orig": "text, although the training set contains only English content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 201, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 677.201, "r_x1": 286.365, "r_y1": 677.201, "r_x2": 286.365, "r_y2": 668.649, "r_x3": 50.112, "r_y3": 668.649, "coord_origin": "TOPLEFT"}, "text": "We provide more visualizations including the intermediate", "orig": "We provide more visualizations including the intermediate", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 202, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 689.156, "r_x1": 195.217, "r_y1": 689.156, "r_x2": 195.217, "r_y2": 680.604, "r_x3": 50.112, "r_y3": 680.604, "coord_origin": "TOPLEFT"}, "text": "steps in the supplementary material.", "orig": "steps in the supplementary material.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 203, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 199.431, "r_y0": 689.156, "r_x1": 286.365, "r_y1": 689.156, "r_x2": 286.365, "r_y2": 680.604, "r_x3": 199.431, "r_y3": 680.604, "coord_origin": "TOPLEFT"}, "text": "Overall these illustra-", "orig": "Overall these illustra-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 204, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 701.111, "r_x1": 286.365, "r_y1": 701.111, "r_x2": 286.365, "r_y2": 692.559, "r_x3": 50.112, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "tions justify the versatility of our method across a diverse", "orig": "tions justify the versatility of our method across a diverse", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 205, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 713.066, "r_x1": 226.888, "r_y1": 713.066, "r_x2": 226.888, "r_y2": 704.514, "r_x3": 50.112, "r_y3": 704.514, "coord_origin": "TOPLEFT"}, "text": "range of table appearances and content type.", "orig": "range of table appearances and content type.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 4, "label": "section_header", "bbox": {"l": 308.862, "t": 490.709, "r": 460.848, "b": 501.457, "coord_origin": "TOPLEFT"}, "confidence": 0.9436525702476501, "cells": [{"index": 206, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 501.457, "r_x1": 460.848, "r_y1": 501.457, "r_x2": 460.848, "r_y2": 490.709, "r_x3": 308.862, "r_y3": 490.709, "coord_origin": "TOPLEFT"}, "text": "6. Future Work &Conclusion", "orig": "6. Future Work &Conclusion", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 0, "label": "text", "bbox": {"l": 308.862, "t": 513.162, "r": 545.115, "b": 653.22, "coord_origin": "TOPLEFT"}, "confidence": 0.9875594973564148, "cells": [{"index": 207, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 521.7139999999999, "r_x1": 545.115, "r_y1": 521.7139999999999, "r_x2": 545.115, "r_y2": 513.162, "r_x3": 320.817, "r_y3": 513.162, "coord_origin": "TOPLEFT"}, "text": "In this paper, we presented TableFormer an end-to-end", "orig": "In this paper, we presented TableFormer an end-to-end", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 208, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 533.669, "r_x1": 545.115, "r_y1": 533.669, "r_x2": 545.115, "r_y2": 525.117, "r_x3": 308.862, "r_y3": 525.117, "coord_origin": "TOPLEFT"}, "text": "transformer based approach to predict table structures and", "orig": "transformer based approach to predict table structures and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 209, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 545.624, "r_x1": 545.115, "r_y1": 545.624, "r_x2": 545.115, "r_y2": 537.072, "r_x3": 308.862, "r_y3": 537.072, "coord_origin": "TOPLEFT"}, "text": "bounding boxes of cells from an image. This approach en-", "orig": "bounding boxes of cells from an image. This approach en-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 210, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 557.579, "r_x1": 545.115, "r_y1": 557.579, "r_x2": 545.115, "r_y2": 549.027, "r_x3": 308.862, "r_y3": 549.027, "coord_origin": "TOPLEFT"}, "text": "ables us to recreate the table structure, and extract the cell", "orig": "ables us to recreate the table structure, and extract the cell", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 211, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 569.534, "r_x1": 524.562, "r_y1": 569.534, "r_x2": 524.562, "r_y2": 560.982, "r_x3": 308.862, "r_y3": 560.982, "coord_origin": "TOPLEFT"}, "text": "content from PDF or OCR by using bounding boxes.", "orig": "content from PDF or OCR by using bounding boxes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 212, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 529.623, "r_y0": 569.534, "r_x1": 545.115, "r_y1": 569.534, "r_x2": 545.115, "r_y2": 560.982, "r_x3": 529.623, "r_y3": 560.982, "coord_origin": "TOPLEFT"}, "text": "Ad-", "orig": "Ad-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 213, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 581.489, "r_x1": 545.115, "r_y1": 581.489, "r_x2": 545.115, "r_y2": 572.937, "r_x3": 308.862, "r_y3": 572.937, "coord_origin": "TOPLEFT"}, "text": "ditionally, it provides the versatility required in real-world", "orig": "ditionally, it provides the versatility required in real-world", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 214, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 593.4449999999999, "r_x1": 545.115, "r_y1": 593.4449999999999, "r_x2": 545.115, "r_y2": 584.893, "r_x3": 308.862, "r_y3": 584.893, "coord_origin": "TOPLEFT"}, "text": "scenarios when dealing with various types of PDF docu-", "orig": "scenarios when dealing with various types of PDF docu-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 215, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 605.4, "r_x1": 335.153, "r_y1": 605.4, "r_x2": 335.153, "r_y2": 596.848, "r_x3": 308.862, "r_y3": 596.848, "coord_origin": "TOPLEFT"}, "text": "ments,", "orig": "ments,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 216, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 339.656, "r_y0": 605.4, "r_x1": 400.468, "r_y1": 605.4, "r_x2": 400.468, "r_y2": 596.848, "r_x3": 339.656, "r_y3": 596.848, "coord_origin": "TOPLEFT"}, "text": "and languages.", "orig": "and languages.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 217, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 408.378, "r_y0": 605.4, "r_x1": 460.672, "r_y1": 605.4, "r_x2": 460.672, "r_y2": 596.848, "r_x3": 408.378, "r_y3": 596.848, "coord_origin": "TOPLEFT"}, "text": "Furthermore,", "orig": "Furthermore,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 218, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 465.175, "r_y0": 605.4, "r_x1": 545.115, "r_y1": 605.4, "r_x2": 545.115, "r_y2": 596.848, "r_x3": 465.175, "r_y3": 596.848, "coord_origin": "TOPLEFT"}, "text": "our method outper-", "orig": "our method outper-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 219, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 617.355, "r_x1": 495.471, "r_y1": 617.355, "r_x2": 495.471, "r_y2": 608.803, "r_x3": 308.862, "r_y3": 608.803, "coord_origin": "TOPLEFT"}, "text": "forms all state-of-the-arts with a wide margin.", "orig": "forms all state-of-the-arts with a wide margin.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 220, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 500.234, "r_y0": 617.355, "r_x1": 545.115, "r_y1": 617.355, "r_x2": 545.115, "r_y2": 608.803, "r_x3": 500.234, "r_y3": 608.803, "coord_origin": "TOPLEFT"}, "text": "Finally, we", "orig": "Finally, we", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 221, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 629.31, "r_x1": 545.115, "r_y1": 629.31, "r_x2": 545.115, "r_y2": 620.758, "r_x3": 308.862, "r_y3": 620.758, "coord_origin": "TOPLEFT"}, "text": "introduce 'SynthTabNet' a challenging synthetically gen-", "orig": "introduce 'SynthTabNet' a challenging synthetically gen-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 222, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 641.265, "r_x1": 545.115, "r_y1": 641.265, "r_x2": 545.115, "r_y2": 632.713, "r_x3": 308.862, "r_y3": 632.713, "coord_origin": "TOPLEFT"}, "text": "erated dataset that reinforces missing characteristics from", "orig": "erated dataset that reinforces missing characteristics from", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 223, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 653.22, "r_x1": 365.858, "r_y1": 653.22, "r_x2": 365.858, "r_y2": 644.668, "r_x3": 308.862, "r_y3": 644.668, "coord_origin": "TOPLEFT"}, "text": "other datasets.", "orig": "other datasets.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 3, "label": "section_header", "bbox": {"l": 308.862, "t": 672.099, "r": 364.406, "b": 682.847, "coord_origin": "TOPLEFT"}, "confidence": 0.9442470073699951, "cells": [{"index": 224, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 682.847, "r_x1": 364.406, "r_y1": 682.847, "r_x2": 364.406, "r_y2": 672.099, "r_x3": 308.862, "r_y3": 672.099, "coord_origin": "TOPLEFT"}, "text": "References", "orig": "References", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 10, "label": "list_item", "bbox": {"l": 313.345, "t": 694.204, "r": 545.113, "b": 712.86, "coord_origin": "TOPLEFT"}, "confidence": 0.8318753838539124, "cells": [{"index": 225, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 313.345, "r_y0": 701.901, "r_x1": 323.8, "r_y1": 701.901, "r_x2": 323.8, "r_y2": 694.204, "r_x3": 313.345, "r_y3": 694.204, "coord_origin": "TOPLEFT"}, "text": "[1]", "orig": "[1]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 226, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.785, "r_y0": 701.901, "r_x1": 545.109, "r_y1": 701.901, "r_x2": 545.109, "r_y2": 694.204, "r_x3": 328.785, "r_y3": 694.204, "coord_origin": "TOPLEFT"}, "text": "Nicolas Carion, Francisco Massa, Gabriel Synnaeve, Nicolas", "orig": "Nicolas Carion, Francisco Massa, Gabriel Synnaeve, Nicolas", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 227, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 712.86, "r_x1": 545.113, "r_y1": 712.86, "r_x2": 545.113, "r_y2": 705.163, "r_x3": 328.781, "r_y3": 705.163, "coord_origin": "TOPLEFT"}, "text": "Usunier, Alexander Kirillov, and Sergey Zagoruyko. End-to-", "orig": "Usunier, Alexander Kirillov, and Sergey Zagoruyko. End-to-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 9, "label": "page_footer", "bbox": {"l": 295.121, "t": 734.402, "r": 300.102, "b": 742.954, "coord_origin": "TOPLEFT"}, "confidence": 0.8709858059883118, "cells": [{"index": 228, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 295.121, "r_y0": 742.954, "r_x1": 300.102, "r_y1": 742.954, "r_x2": 300.102, "r_y2": 734.402, "r_x3": 295.121, "r_y3": 734.402, "coord_origin": "TOPLEFT"}, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 15, "label": "picture", "bbox": {"l": 305.5836486816406, "t": 98.65415954589844, "r": 554.8258666992188, "b": 180.6267547607422, "coord_origin": "TOPLEFT"}, "confidence": 0.7699173092842102, "cells": [], "children": []}, {"id": 14, "label": "picture", "bbox": {"l": 49.97503662109375, "t": 103.71266174316406, "r": 301.6335754394531, "b": 187.5789337158203, "coord_origin": "TOPLEFT"}, "confidence": 0.7873926162719727, "cells": [], "children": []}]}, "tablestructure": {"table_map": {"8": {"label": "table", "id": 8, "page_no": 7, "cluster": {"id": 8, "label": "table", "bbox": {"l": 53.62853240966797, "t": 218.94857788085938, "r": 298.5574951171875, "b": 292.39996337890625, "coord_origin": "TOPLEFT"}, "confidence": 0.8824009299278259, "cells": [{"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 209.933, "r_y0": 226.00400000000002, "r_x1": 223.873, "r_y1": 226.00400000000002, "r_x2": 223.873, "r_y2": 221.35799999999995, "r_x3": 209.933, "r_y3": 221.35799999999995, "coord_origin": "TOPLEFT"}, "text": "\u8ad6\u6587\u30d5\u30a1\u30a4\u30eb", "orig": "\u8ad6\u6587\u30d5\u30a1\u30a4\u30eb", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 263.765, "r_y0": 226.00400000000002, "r_x1": 273.058, "r_y1": 226.00400000000002, "r_x2": 273.058, "r_y2": 221.35799999999995, "r_x3": 263.765, "r_y3": 221.35799999999995, "coord_origin": "TOPLEFT"}, "text": "\u53c2\u8003\u6587\u732e", "orig": "\u53c2\u8003\u6587\u732e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 110.25, "r_y0": 233.49, "r_x1": 114.896, "r_y1": 233.49, "r_x2": 114.896, "r_y2": 228.84400000000005, "r_x3": 110.25, "r_y3": 228.84400000000005, "coord_origin": "TOPLEFT"}, "text": "\u51fa\u5178", "orig": "\u51fa\u5178", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 175.366, "r_y0": 233.49, "r_x1": 186.983, "r_y1": 233.49, "r_x2": 186.983, "r_y2": 228.84400000000005, "r_x3": 175.366, "r_y3": 228.84400000000005, "coord_origin": "TOPLEFT"}, "text": "\u30d5\u30a1\u30a4\u30eb\u6570", "orig": "\u30d5\u30a1\u30a4\u30eb\u6570", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 195.314, "r_y0": 233.49, "r_x1": 199.961, "r_y1": 233.49, "r_x2": 199.961, "r_y2": 228.84400000000005, "r_x3": 195.314, "r_y3": 228.84400000000005, "coord_origin": "TOPLEFT"}, "text": "\u82f1\u8a9e", "orig": "\u82f1\u8a9e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 229.198, "r_y0": 233.49, "r_x1": 236.168, "r_y1": 233.49, "r_x2": 236.168, "r_y2": 228.84400000000005, "r_x3": 229.198, "r_y3": 228.84400000000005, "coord_origin": "TOPLEFT"}, "text": "\u65e5\u672c\u8a9e", "orig": "\u65e5\u672c\u8a9e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 256.114, "r_y0": 233.49, "r_x1": 260.761, "r_y1": 233.49, "r_x2": 260.761, "r_y2": 228.84400000000005, "r_x3": 256.114, "r_y3": 228.84400000000005, "coord_origin": "TOPLEFT"}, "text": "\u82f1\u8a9e", "orig": "\u82f1\u8a9e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 278.384, "r_y0": 233.49, "r_x1": 285.354, "r_y1": 233.49, "r_x2": 285.354, "r_y2": 228.84400000000005, "r_x3": 278.384, "r_y3": 228.84400000000005, "coord_origin": "TOPLEFT"}, "text": "\u65e5\u672c\u8a9e", "orig": "\u65e5\u672c\u8a9e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 55.531, "r_y0": 240.76800000000003, "r_x1": 162.713, "r_y1": 240.76800000000003, "r_x2": 162.713, "r_y2": 236.48199999999997, "r_x3": 55.531, "r_y3": 236.48199999999997, "coord_origin": "TOPLEFT"}, "text": "Association for Computational Linguistics(ACL2003)", "orig": "Association for Computational Linguistics(ACL2003)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 184.397, "r_y0": 240.76800000000003, "r_x1": 189.565, "r_y1": 240.76800000000003, "r_x2": 189.565, "r_y2": 236.48199999999997, "r_x3": 184.397, "r_y3": 236.48199999999997, "coord_origin": "TOPLEFT"}, "text": "65", "orig": "65", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 208.99, "r_y0": 240.76800000000003, "r_x1": 214.158, "r_y1": 240.76800000000003, "r_x2": 214.158, "r_y2": 236.48199999999997, "r_x3": 208.99, "r_y3": 236.48199999999997, "coord_origin": "TOPLEFT"}, "text": "65", "orig": "65", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 234.875, "r_y0": 240.76800000000003, "r_x1": 237.458, "r_y1": 240.76800000000003, "r_x2": 237.458, "r_y2": 236.48199999999997, "r_x3": 234.875, "r_y3": 236.48199999999997, "coord_origin": "TOPLEFT"}, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 256.884, "r_y0": 240.76800000000003, "r_x1": 264.636, "r_y1": 240.76800000000003, "r_x2": 264.636, "r_y2": 236.48199999999997, "r_x3": 256.884, "r_y3": 236.48199999999997, "coord_origin": "TOPLEFT"}, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 284.061, "r_y0": 240.76800000000003, "r_x1": 286.644, "r_y1": 240.76800000000003, "r_x2": 286.644, "r_y2": 236.48199999999997, "r_x3": 284.061, "r_y3": 236.48199999999997, "coord_origin": "TOPLEFT"}, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 55.531, "r_y0": 246.962, "r_x1": 139.722, "r_y1": 246.962, "r_x2": 139.722, "r_y2": 242.67600000000004, "r_x3": 55.531, "r_y3": 242.67600000000004, "coord_origin": "TOPLEFT"}, "text": "Computational Linguistics(COLING2002)", "orig": "Computational Linguistics(COLING2002)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 19, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.105, "r_y0": 246.962, "r_x1": 190.857, "r_y1": 246.962, "r_x2": 190.857, "r_y2": 242.67600000000004, "r_x3": 183.105, "r_y3": 242.67600000000004, "coord_origin": "TOPLEFT"}, "text": "140", "orig": "140", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 20, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 207.698, "r_y0": 246.962, "r_x1": 215.45, "r_y1": 246.962, "r_x2": 215.45, "r_y2": 242.67600000000004, "r_x3": 207.698, "r_y3": 242.67600000000004, "coord_origin": "TOPLEFT"}, "text": "140", "orig": "140", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 21, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 234.875, "r_y0": 246.962, "r_x1": 237.458, "r_y1": 246.962, "r_x2": 237.458, "r_y2": 242.67600000000004, "r_x3": 234.875, "r_y3": 242.67600000000004, "coord_origin": "TOPLEFT"}, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 22, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 256.884, "r_y0": 246.962, "r_x1": 264.636, "r_y1": 246.962, "r_x2": 264.636, "r_y2": 242.67600000000004, "r_x3": 256.884, "r_y3": 242.67600000000004, "coord_origin": "TOPLEFT"}, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 23, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 284.061, "r_y0": 246.962, "r_x1": 286.644, "r_y1": 246.962, "r_x2": 286.644, "r_y2": 242.67600000000004, "r_x3": 284.061, "r_y3": 242.67600000000004, "coord_origin": "TOPLEFT"}, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 24, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 55.531, "r_y0": 253.62199999999996, "r_x1": 74.118, "r_y1": 253.62199999999996, "r_x2": 74.118, "r_y2": 248.976, "r_x3": 55.531, "r_y3": 248.976, "coord_origin": "TOPLEFT"}, "text": "\u96fb\u6c17\u60c5\u5831\u901a\u4fe1\u5b66\u4f1a", "orig": "\u96fb\u6c17\u60c5\u5831\u901a\u4fe1\u5b66\u4f1a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 25, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 92.698, "r_y0": 253.93100000000004, "r_x1": 103.034, "r_y1": 253.93100000000004, "r_x2": 103.034, "r_y2": 249.64499999999998, "r_x3": 92.698, "r_y3": 249.64499999999998, "coord_origin": "TOPLEFT"}, "text": "2003", "orig": "2003", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 26, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 103.034, "r_y0": 253.62199999999996, "r_x1": 114.651, "r_y1": 253.62199999999996, "r_x2": 114.651, "r_y2": 248.976, "r_x3": 103.034, "r_y3": 248.976, "coord_origin": "TOPLEFT"}, "text": "\u5e74\u7dcf\u5408\u5927\u4f1a", "orig": "\u5e74\u7dcf\u5408\u5927\u4f1a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 27, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.105, "r_y0": 253.15700000000004, "r_x1": 190.857, "r_y1": 253.15700000000004, "r_x2": 190.857, "r_y2": 248.87099999999998, "r_x3": 183.105, "r_y3": 248.87099999999998, "coord_origin": "TOPLEFT"}, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 28, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 210.282, "r_y0": 253.15700000000004, "r_x1": 212.865, "r_y1": 253.15700000000004, "r_x2": 212.865, "r_y2": 248.87099999999998, "r_x3": 210.282, "r_y3": 248.87099999999998, "coord_origin": "TOPLEFT"}, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 29, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 232.292, "r_y0": 253.15700000000004, "r_x1": 240.043, "r_y1": 253.15700000000004, "r_x2": 240.043, "r_y2": 248.87099999999998, "r_x3": 232.292, "r_y3": 248.87099999999998, "coord_origin": "TOPLEFT"}, "text": "142", "orig": "142", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 30, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 256.884, "r_y0": 253.15700000000004, "r_x1": 264.636, "r_y1": 253.15700000000004, "r_x2": 264.636, "r_y2": 248.87099999999998, "r_x3": 256.884, "r_y3": 248.87099999999998, "coord_origin": "TOPLEFT"}, "text": "223", "orig": "223", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 281.477, "r_y0": 253.15700000000004, "r_x1": 289.229, "r_y1": 253.15700000000004, "r_x2": 289.229, "r_y2": 248.87099999999998, "r_x3": 281.477, "r_y3": 248.87099999999998, "coord_origin": "TOPLEFT"}, "text": "147", "orig": "147", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 55.531, "r_y0": 261.10699999999997, "r_x1": 71.794, "r_y1": 261.10699999999997, "r_x2": 71.794, "r_y2": 256.461, "r_x3": 55.531, "r_y3": 256.461, "coord_origin": "TOPLEFT"}, "text": "\u60c5\u5831\u51e6\u7406\u5b66\u4f1a\u7b2c", "orig": "\u60c5\u5831\u51e6\u7406\u5b66\u4f1a\u7b2c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 88.053, "r_y0": 261.41600000000005, "r_x1": 93.22, "r_y1": 261.41600000000005, "r_x2": 93.22, "r_y2": 257.13, "r_x3": 88.053, "r_y3": 257.13, "coord_origin": "TOPLEFT"}, "text": "65", "orig": "65", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 93.22, "r_y0": 261.10699999999997, "r_x1": 104.837, "r_y1": 261.10699999999997, "r_x2": 104.837, "r_y2": 256.461, "r_x3": 93.22, "r_y3": 256.461, "coord_origin": "TOPLEFT"}, "text": "\u56de\u5168\u56fd\u5927\u4f1a", "orig": "\u56de\u5168\u56fd\u5927\u4f1a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 116.451, "r_y0": 261.41600000000005, "r_x1": 129.882, "r_y1": 261.41600000000005, "r_x2": 129.882, "r_y2": 257.13, "r_x3": 116.451, "r_y3": 257.13, "coord_origin": "TOPLEFT"}, "text": "(2003)", "orig": "(2003)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.105, "r_y0": 260.64200000000005, "r_x1": 190.857, "r_y1": 260.64200000000005, "r_x2": 190.857, "r_y2": 256.356, "r_x3": 183.105, "r_y3": 256.356, "coord_origin": "TOPLEFT"}, "text": "177", "orig": "177", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 210.282, "r_y0": 260.64200000000005, "r_x1": 212.865, "r_y1": 260.64200000000005, "r_x2": 212.865, "r_y2": 256.356, "r_x3": 210.282, "r_y3": 256.356, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 232.292, "r_y0": 260.64200000000005, "r_x1": 240.043, "r_y1": 260.64200000000005, "r_x2": 240.043, "r_y2": 256.356, "r_x3": 232.292, "r_y3": 256.356, "coord_origin": "TOPLEFT"}, "text": "176", "orig": "176", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 256.884, "r_y0": 260.64200000000005, "r_x1": 264.636, "r_y1": 260.64200000000005, "r_x2": 264.636, "r_y2": 256.356, "r_x3": 256.884, "r_y3": 256.356, "coord_origin": "TOPLEFT"}, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 281.477, "r_y0": 260.64200000000005, "r_x1": 289.229, "r_y1": 260.64200000000005, "r_x2": 289.229, "r_y2": 256.356, "r_x3": 281.477, "r_y3": 256.356, "coord_origin": "TOPLEFT"}, "text": "236", "orig": "236", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 55.531, "r_y0": 268.33399999999995, "r_x1": 57.854, "r_y1": 268.33399999999995, "r_x2": 57.854, "r_y2": 263.688, "r_x3": 55.531, "r_y3": 263.688, "coord_origin": "TOPLEFT"}, "text": "\u7b2c", "orig": "\u7b2c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 60.177, "r_y0": 268.644, "r_x1": 65.344, "r_y1": 268.644, "r_x2": 65.344, "r_y2": 264.35699999999997, "r_x3": 60.177, "r_y3": 264.35699999999997, "coord_origin": "TOPLEFT"}, "text": "17", "orig": "17", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 65.344, "r_y0": 268.33399999999995, "r_x1": 90.902, "r_y1": 268.33399999999995, "r_x2": 90.902, "r_y2": 263.688, "r_x3": 65.344, "r_y3": 263.688, "coord_origin": "TOPLEFT"}, "text": "\u56de\u4eba\u5de5\u77e5\u80fd\u5b66\u4f1a\u5168\u56fd\u5927\u4f1a", "orig": "\u56de\u4eba\u5de5\u77e5\u80fd\u5b66\u4f1a\u5168\u56fd\u5927\u4f1a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 116.451, "r_y0": 268.644, "r_x1": 129.882, "r_y1": 268.644, "r_x2": 129.882, "r_y2": 264.35699999999997, "r_x3": 116.451, "r_y3": 264.35699999999997, "coord_origin": "TOPLEFT"}, "text": "(2003)", "orig": "(2003)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.105, "r_y0": 267.869, "r_x1": 190.857, "r_y1": 267.869, "r_x2": 190.857, "r_y2": 263.58299999999997, "r_x3": 183.105, "r_y3": 263.58299999999997, "coord_origin": "TOPLEFT"}, "text": "208", "orig": "208", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 210.282, "r_y0": 267.869, "r_x1": 212.865, "r_y1": 267.869, "r_x2": 212.865, "r_y2": 263.58299999999997, "r_x3": 210.282, "r_y3": 263.58299999999997, "coord_origin": "TOPLEFT"}, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 232.292, "r_y0": 267.869, "r_x1": 240.043, "r_y1": 267.869, "r_x2": 240.043, "r_y2": 263.58299999999997, "r_x3": 232.292, "r_y3": 263.58299999999997, "coord_origin": "TOPLEFT"}, "text": "203", "orig": "203", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 48, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 256.884, "r_y0": 267.869, "r_x1": 264.636, "r_y1": 267.869, "r_x2": 264.636, "r_y2": 263.58299999999997, "r_x3": 256.884, "r_y3": 263.58299999999997, "coord_origin": "TOPLEFT"}, "text": "152", "orig": "152", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 49, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 281.477, "r_y0": 267.869, "r_x1": 289.229, "r_y1": 267.869, "r_x2": 289.229, "r_y2": 263.58299999999997, "r_x3": 281.477, "r_y3": 263.58299999999997, "coord_origin": "TOPLEFT"}, "text": "244", "orig": "244", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 50, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 55.531, "r_y0": 275.562, "r_x1": 78.765, "r_y1": 275.562, "r_x2": 78.765, "r_y2": 270.91600000000005, "r_x3": 55.531, "r_y3": 270.91600000000005, "coord_origin": "TOPLEFT"}, "text": "\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u7814\u7a76\u4f1a\u7b2c", "orig": "\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u7814\u7a76\u4f1a\u7b2c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 51, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 101.99, "r_y0": 275.871, "r_x1": 109.742, "r_y1": 275.871, "r_x2": 109.742, "r_y2": 271.58500000000004, "r_x3": 101.99, "r_y3": 271.58500000000004, "coord_origin": "TOPLEFT"}, "text": "146", "orig": "146", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 52, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 109.742, "r_y0": 275.562, "r_x1": 112.065, "r_y1": 275.562, "r_x2": 112.065, "r_y2": 270.91600000000005, "r_x3": 109.742, "r_y3": 270.91600000000005, "coord_origin": "TOPLEFT"}, "text": "\u301c", "orig": "\u301c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 53, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 114.388, "r_y0": 275.871, "r_x1": 122.139, "r_y1": 275.871, "r_x2": 122.139, "r_y2": 271.58500000000004, "r_x3": 114.388, "r_y3": 271.58500000000004, "coord_origin": "TOPLEFT"}, "text": "155", "orig": "155", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 54, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 122.14, "r_y0": 275.562, "r_x1": 124.463, "r_y1": 275.562, "r_x2": 124.463, "r_y2": 270.91600000000005, "r_x3": 122.14, "r_y3": 270.91600000000005, "coord_origin": "TOPLEFT"}, "text": "\u56de", "orig": "\u56de", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 55, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 184.397, "r_y0": 275.096, "r_x1": 189.565, "r_y1": 275.096, "r_x2": 189.565, "r_y2": 270.80999999999995, "r_x3": 184.397, "r_y3": 270.80999999999995, "coord_origin": "TOPLEFT"}, "text": "98", "orig": "98", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 56, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 210.282, "r_y0": 275.096, "r_x1": 212.865, "r_y1": 275.096, "r_x2": 212.865, "r_y2": 270.80999999999995, "r_x3": 210.282, "r_y3": 270.80999999999995, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 57, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 233.583, "r_y0": 275.096, "r_x1": 238.751, "r_y1": 275.096, "r_x2": 238.751, "r_y2": 270.80999999999995, "r_x3": 233.583, "r_y3": 270.80999999999995, "coord_origin": "TOPLEFT"}, "text": "96", "orig": "96", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 58, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 256.884, "r_y0": 275.096, "r_x1": 264.636, "r_y1": 275.096, "r_x2": 264.636, "r_y2": 270.80999999999995, "r_x3": 256.884, "r_y3": 270.80999999999995, "coord_origin": "TOPLEFT"}, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 59, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 281.477, "r_y0": 275.096, "r_x1": 289.229, "r_y1": 275.096, "r_x2": 289.229, "r_y2": 270.80999999999995, "r_x3": 281.477, "r_y3": 270.80999999999995, "coord_origin": "TOPLEFT"}, "text": "232", "orig": "232", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 60, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 55.531, "r_y0": 283.356, "r_x1": 68.686, "r_y1": 283.356, "r_x2": 68.686, "r_y2": 279.07000000000005, "r_x3": 55.531, "r_y3": 279.07000000000005, "coord_origin": "TOPLEFT"}, "text": "WWW", "orig": "WWW", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 61, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 68.686, "r_y0": 283.047, "r_x1": 87.273, "r_y1": 283.047, "r_x2": 87.273, "r_y2": 278.40099999999995, "r_x3": 68.686, "r_y3": 278.40099999999995, "coord_origin": "TOPLEFT"}, "text": "\u304b\u3089\u53ce\u96c6\u3057\u305f\u8ad6\u6587", "orig": "\u304b\u3089\u53ce\u96c6\u3057\u305f\u8ad6\u6587", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 62, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.105, "r_y0": 282.323, "r_x1": 190.857, "r_y1": 282.323, "r_x2": 190.857, "r_y2": 278.03700000000003, "r_x3": 183.105, "r_y3": 278.03700000000003, "coord_origin": "TOPLEFT"}, "text": "107", "orig": "107", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 63, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 208.99, "r_y0": 282.323, "r_x1": 214.158, "r_y1": 282.323, "r_x2": 214.158, "r_y2": 278.03700000000003, "r_x3": 208.99, "r_y3": 278.03700000000003, "coord_origin": "TOPLEFT"}, "text": "73", "orig": "73", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 64, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 233.583, "r_y0": 282.323, "r_x1": 238.751, "r_y1": 282.323, "r_x2": 238.751, "r_y2": 278.03700000000003, "r_x3": 233.583, "r_y3": 278.03700000000003, "coord_origin": "TOPLEFT"}, "text": "34", "orig": "34", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 65, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 256.884, "r_y0": 282.323, "r_x1": 264.636, "r_y1": 282.323, "r_x2": 264.636, "r_y2": 278.03700000000003, "r_x3": 256.884, "r_y3": 278.03700000000003, "coord_origin": "TOPLEFT"}, "text": "147", "orig": "147", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 66, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 282.769, "r_y0": 282.323, "r_x1": 287.937, "r_y1": 282.323, "r_x2": 287.937, "r_y2": 278.03700000000003, "r_x3": 282.769, "r_y3": 278.03700000000003, "coord_origin": "TOPLEFT"}, "text": "96", "orig": "96", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 67, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 169.615, "r_y0": 290.274, "r_x1": 171.938, "r_y1": 290.274, "r_x2": 171.938, "r_y2": 285.628, "r_x3": 169.615, "r_y3": 285.628, "coord_origin": "TOPLEFT"}, "text": "\u8a08", "orig": "\u8a08", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 68, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.105, "r_y0": 289.809, "r_x1": 190.857, "r_y1": 289.809, "r_x2": 190.857, "r_y2": 285.522, "r_x3": 183.105, "r_y3": 285.522, "coord_origin": "TOPLEFT"}, "text": "945", "orig": "945", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 69, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 207.698, "r_y0": 289.809, "r_x1": 215.45, "r_y1": 289.809, "r_x2": 215.45, "r_y2": 285.522, "r_x3": 207.698, "r_y3": 285.522, "coord_origin": "TOPLEFT"}, "text": "294", "orig": "294", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 70, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 232.292, "r_y0": 289.809, "r_x1": 240.043, "r_y1": 289.809, "r_x2": 240.043, "r_y2": 285.522, "r_x3": 232.292, "r_y3": 285.522, "coord_origin": "TOPLEFT"}, "text": "651", "orig": "651", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 71, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 255.765, "r_y0": 289.809, "r_x1": 265.752, "r_y1": 289.809, "r_x2": 265.752, "r_y2": 285.522, "r_x3": 255.765, "r_y3": 285.522, "coord_origin": "TOPLEFT"}, "text": "1122", "orig": "1122", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 72, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 281.477, "r_y0": 289.809, "r_x1": 289.229, "r_y1": 289.809, "r_x2": 289.229, "r_y2": 285.522, "r_x3": 281.477, "r_y3": 285.522, "coord_origin": "TOPLEFT"}, "text": "955", "orig": "955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": [{"id": 55, "label": "text", "bbox": {"l": 209.933, "t": 221.35799999999995, "r": 223.873, "b": 226.00400000000002, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 209.933, "r_y0": 226.00400000000002, "r_x1": 223.873, "r_y1": 226.00400000000002, "r_x2": 223.873, "r_y2": 221.35799999999995, "r_x3": 209.933, "r_y3": 221.35799999999995, "coord_origin": "TOPLEFT"}, "text": "\u8ad6\u6587\u30d5\u30a1\u30a4\u30eb", "orig": "\u8ad6\u6587\u30d5\u30a1\u30a4\u30eb", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 56, "label": "text", "bbox": {"l": 263.765, "t": 221.35799999999995, "r": 273.058, "b": 226.00400000000002, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 263.765, "r_y0": 226.00400000000002, "r_x1": 273.058, "r_y1": 226.00400000000002, "r_x2": 273.058, "r_y2": 221.35799999999995, "r_x3": 263.765, "r_y3": 221.35799999999995, "coord_origin": "TOPLEFT"}, "text": "\u53c2\u8003\u6587\u732e", "orig": "\u53c2\u8003\u6587\u732e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 57, "label": "text", "bbox": {"l": 110.25, "t": 228.84400000000005, "r": 114.896, "b": 233.49, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 110.25, "r_y0": 233.49, "r_x1": 114.896, "r_y1": 233.49, "r_x2": 114.896, "r_y2": 228.84400000000005, "r_x3": 110.25, "r_y3": 228.84400000000005, "coord_origin": "TOPLEFT"}, "text": "\u51fa\u5178", "orig": "\u51fa\u5178", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 58, "label": "text", "bbox": {"l": 175.366, "t": 228.84400000000005, "r": 186.983, "b": 233.49, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 175.366, "r_y0": 233.49, "r_x1": 186.983, "r_y1": 233.49, "r_x2": 186.983, "r_y2": 228.84400000000005, "r_x3": 175.366, "r_y3": 228.84400000000005, "coord_origin": "TOPLEFT"}, "text": "\u30d5\u30a1\u30a4\u30eb\u6570", "orig": "\u30d5\u30a1\u30a4\u30eb\u6570", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 59, "label": "text", "bbox": {"l": 195.314, "t": 228.84400000000005, "r": 199.961, "b": 233.49, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 195.314, "r_y0": 233.49, "r_x1": 199.961, "r_y1": 233.49, "r_x2": 199.961, "r_y2": 228.84400000000005, "r_x3": 195.314, "r_y3": 228.84400000000005, "coord_origin": "TOPLEFT"}, "text": "\u82f1\u8a9e", "orig": "\u82f1\u8a9e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 60, "label": "text", "bbox": {"l": 229.198, "t": 228.84400000000005, "r": 236.168, "b": 233.49, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 229.198, "r_y0": 233.49, "r_x1": 236.168, "r_y1": 233.49, "r_x2": 236.168, "r_y2": 228.84400000000005, "r_x3": 229.198, "r_y3": 228.84400000000005, "coord_origin": "TOPLEFT"}, "text": "\u65e5\u672c\u8a9e", "orig": "\u65e5\u672c\u8a9e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 61, "label": "text", "bbox": {"l": 256.114, "t": 228.84400000000005, "r": 260.761, "b": 233.49, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 256.114, "r_y0": 233.49, "r_x1": 260.761, "r_y1": 233.49, "r_x2": 260.761, "r_y2": 228.84400000000005, "r_x3": 256.114, "r_y3": 228.84400000000005, "coord_origin": "TOPLEFT"}, "text": "\u82f1\u8a9e", "orig": "\u82f1\u8a9e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 62, "label": "text", "bbox": {"l": 278.384, "t": 228.84400000000005, "r": 285.354, "b": 233.49, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 278.384, "r_y0": 233.49, "r_x1": 285.354, "r_y1": 233.49, "r_x2": 285.354, "r_y2": 228.84400000000005, "r_x3": 278.384, "r_y3": 228.84400000000005, "coord_origin": "TOPLEFT"}, "text": "\u65e5\u672c\u8a9e", "orig": "\u65e5\u672c\u8a9e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 63, "label": "text", "bbox": {"l": 55.531, "t": 236.48199999999997, "r": 162.713, "b": 240.76800000000003, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 55.531, "r_y0": 240.76800000000003, "r_x1": 162.713, "r_y1": 240.76800000000003, "r_x2": 162.713, "r_y2": 236.48199999999997, "r_x3": 55.531, "r_y3": 236.48199999999997, "coord_origin": "TOPLEFT"}, "text": "Association for Computational Linguistics(ACL2003)", "orig": "Association for Computational Linguistics(ACL2003)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 64, "label": "text", "bbox": {"l": 184.397, "t": 236.48199999999997, "r": 189.565, "b": 240.76800000000003, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 184.397, "r_y0": 240.76800000000003, "r_x1": 189.565, "r_y1": 240.76800000000003, "r_x2": 189.565, "r_y2": 236.48199999999997, "r_x3": 184.397, "r_y3": 236.48199999999997, "coord_origin": "TOPLEFT"}, "text": "65", "orig": "65", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 65, "label": "text", "bbox": {"l": 208.99, "t": 236.48199999999997, "r": 214.158, "b": 240.76800000000003, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 208.99, "r_y0": 240.76800000000003, "r_x1": 214.158, "r_y1": 240.76800000000003, "r_x2": 214.158, "r_y2": 236.48199999999997, "r_x3": 208.99, "r_y3": 236.48199999999997, "coord_origin": "TOPLEFT"}, "text": "65", "orig": "65", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 66, "label": "text", "bbox": {"l": 234.875, "t": 236.48199999999997, "r": 237.458, "b": 240.76800000000003, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 234.875, "r_y0": 240.76800000000003, "r_x1": 237.458, "r_y1": 240.76800000000003, "r_x2": 237.458, "r_y2": 236.48199999999997, "r_x3": 234.875, "r_y3": 236.48199999999997, "coord_origin": "TOPLEFT"}, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 67, "label": "text", "bbox": {"l": 256.884, "t": 236.48199999999997, "r": 264.636, "b": 240.76800000000003, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 256.884, "r_y0": 240.76800000000003, "r_x1": 264.636, "r_y1": 240.76800000000003, "r_x2": 264.636, "r_y2": 236.48199999999997, "r_x3": 256.884, "r_y3": 236.48199999999997, "coord_origin": "TOPLEFT"}, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 68, "label": "text", "bbox": {"l": 284.061, "t": 236.48199999999997, "r": 286.644, "b": 240.76800000000003, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 284.061, "r_y0": 240.76800000000003, "r_x1": 286.644, "r_y1": 240.76800000000003, "r_x2": 286.644, "r_y2": 236.48199999999997, "r_x3": 284.061, "r_y3": 236.48199999999997, "coord_origin": "TOPLEFT"}, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 69, "label": "text", "bbox": {"l": 55.531, "t": 242.67600000000004, "r": 139.722, "b": 246.962, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 55.531, "r_y0": 246.962, "r_x1": 139.722, "r_y1": 246.962, "r_x2": 139.722, "r_y2": 242.67600000000004, "r_x3": 55.531, "r_y3": 242.67600000000004, "coord_origin": "TOPLEFT"}, "text": "Computational Linguistics(COLING2002)", "orig": "Computational Linguistics(COLING2002)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 70, "label": "text", "bbox": {"l": 183.105, "t": 242.67600000000004, "r": 190.857, "b": 246.962, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 19, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.105, "r_y0": 246.962, "r_x1": 190.857, "r_y1": 246.962, "r_x2": 190.857, "r_y2": 242.67600000000004, "r_x3": 183.105, "r_y3": 242.67600000000004, "coord_origin": "TOPLEFT"}, "text": "140", "orig": "140", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 71, "label": "text", "bbox": {"l": 207.698, "t": 242.67600000000004, "r": 215.45, "b": 246.962, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 20, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 207.698, "r_y0": 246.962, "r_x1": 215.45, "r_y1": 246.962, "r_x2": 215.45, "r_y2": 242.67600000000004, "r_x3": 207.698, "r_y3": 242.67600000000004, "coord_origin": "TOPLEFT"}, "text": "140", "orig": "140", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 72, "label": "text", "bbox": {"l": 234.875, "t": 242.67600000000004, "r": 237.458, "b": 246.962, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 21, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 234.875, "r_y0": 246.962, "r_x1": 237.458, "r_y1": 246.962, "r_x2": 237.458, "r_y2": 242.67600000000004, "r_x3": 234.875, "r_y3": 242.67600000000004, "coord_origin": "TOPLEFT"}, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 73, "label": "text", "bbox": {"l": 256.884, "t": 242.67600000000004, "r": 264.636, "b": 246.962, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 22, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 256.884, "r_y0": 246.962, "r_x1": 264.636, "r_y1": 246.962, "r_x2": 264.636, "r_y2": 242.67600000000004, "r_x3": 256.884, "r_y3": 242.67600000000004, "coord_origin": "TOPLEFT"}, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 74, "label": "text", "bbox": {"l": 284.061, "t": 242.67600000000004, "r": 286.644, "b": 246.962, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 23, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 284.061, "r_y0": 246.962, "r_x1": 286.644, "r_y1": 246.962, "r_x2": 286.644, "r_y2": 242.67600000000004, "r_x3": 284.061, "r_y3": 242.67600000000004, "coord_origin": "TOPLEFT"}, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 75, "label": "text", "bbox": {"l": 55.531, "t": 248.976, "r": 74.118, "b": 253.62199999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 24, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 55.531, "r_y0": 253.62199999999996, "r_x1": 74.118, "r_y1": 253.62199999999996, "r_x2": 74.118, "r_y2": 248.976, "r_x3": 55.531, "r_y3": 248.976, "coord_origin": "TOPLEFT"}, "text": "\u96fb\u6c17\u60c5\u5831\u901a\u4fe1\u5b66\u4f1a", "orig": "\u96fb\u6c17\u60c5\u5831\u901a\u4fe1\u5b66\u4f1a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 76, "label": "text", "bbox": {"l": 92.698, "t": 249.64499999999998, "r": 103.034, "b": 253.93100000000004, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 25, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 92.698, "r_y0": 253.93100000000004, "r_x1": 103.034, "r_y1": 253.93100000000004, "r_x2": 103.034, "r_y2": 249.64499999999998, "r_x3": 92.698, "r_y3": 249.64499999999998, "coord_origin": "TOPLEFT"}, "text": "2003", "orig": "2003", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 77, "label": "text", "bbox": {"l": 103.034, "t": 248.976, "r": 114.651, "b": 253.62199999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 26, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 103.034, "r_y0": 253.62199999999996, "r_x1": 114.651, "r_y1": 253.62199999999996, "r_x2": 114.651, "r_y2": 248.976, "r_x3": 103.034, "r_y3": 248.976, "coord_origin": "TOPLEFT"}, "text": "\u5e74\u7dcf\u5408\u5927\u4f1a", "orig": "\u5e74\u7dcf\u5408\u5927\u4f1a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 78, "label": "text", "bbox": {"l": 183.105, "t": 248.87099999999998, "r": 190.857, "b": 253.15700000000004, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 27, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.105, "r_y0": 253.15700000000004, "r_x1": 190.857, "r_y1": 253.15700000000004, "r_x2": 190.857, "r_y2": 248.87099999999998, "r_x3": 183.105, "r_y3": 248.87099999999998, "coord_origin": "TOPLEFT"}, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 79, "label": "text", "bbox": {"l": 210.282, "t": 248.87099999999998, "r": 212.865, "b": 253.15700000000004, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 28, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 210.282, "r_y0": 253.15700000000004, "r_x1": 212.865, "r_y1": 253.15700000000004, "r_x2": 212.865, "r_y2": 248.87099999999998, "r_x3": 210.282, "r_y3": 248.87099999999998, "coord_origin": "TOPLEFT"}, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 80, "label": "text", "bbox": {"l": 232.292, "t": 248.87099999999998, "r": 240.043, "b": 253.15700000000004, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 29, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 232.292, "r_y0": 253.15700000000004, "r_x1": 240.043, "r_y1": 253.15700000000004, "r_x2": 240.043, "r_y2": 248.87099999999998, "r_x3": 232.292, "r_y3": 248.87099999999998, "coord_origin": "TOPLEFT"}, "text": "142", "orig": "142", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 81, "label": "text", "bbox": {"l": 256.884, "t": 248.87099999999998, "r": 264.636, "b": 253.15700000000004, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 30, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 256.884, "r_y0": 253.15700000000004, "r_x1": 264.636, "r_y1": 253.15700000000004, "r_x2": 264.636, "r_y2": 248.87099999999998, "r_x3": 256.884, "r_y3": 248.87099999999998, "coord_origin": "TOPLEFT"}, "text": "223", "orig": "223", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 82, "label": "text", "bbox": {"l": 281.477, "t": 248.87099999999998, "r": 289.229, "b": 253.15700000000004, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 281.477, "r_y0": 253.15700000000004, "r_x1": 289.229, "r_y1": 253.15700000000004, "r_x2": 289.229, "r_y2": 248.87099999999998, "r_x3": 281.477, "r_y3": 248.87099999999998, "coord_origin": "TOPLEFT"}, "text": "147", "orig": "147", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 83, "label": "text", "bbox": {"l": 55.531, "t": 256.461, "r": 71.794, "b": 261.10699999999997, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 55.531, "r_y0": 261.10699999999997, "r_x1": 71.794, "r_y1": 261.10699999999997, "r_x2": 71.794, "r_y2": 256.461, "r_x3": 55.531, "r_y3": 256.461, "coord_origin": "TOPLEFT"}, "text": "\u60c5\u5831\u51e6\u7406\u5b66\u4f1a\u7b2c", "orig": "\u60c5\u5831\u51e6\u7406\u5b66\u4f1a\u7b2c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 84, "label": "text", "bbox": {"l": 88.053, "t": 257.13, "r": 93.22, "b": 261.41600000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 88.053, "r_y0": 261.41600000000005, "r_x1": 93.22, "r_y1": 261.41600000000005, "r_x2": 93.22, "r_y2": 257.13, "r_x3": 88.053, "r_y3": 257.13, "coord_origin": "TOPLEFT"}, "text": "65", "orig": "65", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 85, "label": "text", "bbox": {"l": 93.22, "t": 256.461, "r": 104.837, "b": 261.10699999999997, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 93.22, "r_y0": 261.10699999999997, "r_x1": 104.837, "r_y1": 261.10699999999997, "r_x2": 104.837, "r_y2": 256.461, "r_x3": 93.22, "r_y3": 256.461, "coord_origin": "TOPLEFT"}, "text": "\u56de\u5168\u56fd\u5927\u4f1a", "orig": "\u56de\u5168\u56fd\u5927\u4f1a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 86, "label": "text", "bbox": {"l": 116.451, "t": 257.13, "r": 129.882, "b": 261.41600000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 116.451, "r_y0": 261.41600000000005, "r_x1": 129.882, "r_y1": 261.41600000000005, "r_x2": 129.882, "r_y2": 257.13, "r_x3": 116.451, "r_y3": 257.13, "coord_origin": "TOPLEFT"}, "text": "(2003)", "orig": "(2003)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 87, "label": "text", "bbox": {"l": 183.105, "t": 256.356, "r": 190.857, "b": 260.64200000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.105, "r_y0": 260.64200000000005, "r_x1": 190.857, "r_y1": 260.64200000000005, "r_x2": 190.857, "r_y2": 256.356, "r_x3": 183.105, "r_y3": 256.356, "coord_origin": "TOPLEFT"}, "text": "177", "orig": "177", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 88, "label": "text", "bbox": {"l": 210.282, "t": 256.356, "r": 212.865, "b": 260.64200000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 210.282, "r_y0": 260.64200000000005, "r_x1": 212.865, "r_y1": 260.64200000000005, "r_x2": 212.865, "r_y2": 256.356, "r_x3": 210.282, "r_y3": 256.356, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 89, "label": "text", "bbox": {"l": 232.292, "t": 256.356, "r": 240.043, "b": 260.64200000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 232.292, "r_y0": 260.64200000000005, "r_x1": 240.043, "r_y1": 260.64200000000005, "r_x2": 240.043, "r_y2": 256.356, "r_x3": 232.292, "r_y3": 256.356, "coord_origin": "TOPLEFT"}, "text": "176", "orig": "176", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 90, "label": "text", "bbox": {"l": 256.884, "t": 256.356, "r": 264.636, "b": 260.64200000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 256.884, "r_y0": 260.64200000000005, "r_x1": 264.636, "r_y1": 260.64200000000005, "r_x2": 264.636, "r_y2": 256.356, "r_x3": 256.884, "r_y3": 256.356, "coord_origin": "TOPLEFT"}, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 91, "label": "text", "bbox": {"l": 281.477, "t": 256.356, "r": 289.229, "b": 260.64200000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 281.477, "r_y0": 260.64200000000005, "r_x1": 289.229, "r_y1": 260.64200000000005, "r_x2": 289.229, "r_y2": 256.356, "r_x3": 281.477, "r_y3": 256.356, "coord_origin": "TOPLEFT"}, "text": "236", "orig": "236", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 92, "label": "text", "bbox": {"l": 55.531, "t": 263.688, "r": 57.854, "b": 268.33399999999995, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 55.531, "r_y0": 268.33399999999995, "r_x1": 57.854, "r_y1": 268.33399999999995, "r_x2": 57.854, "r_y2": 263.688, "r_x3": 55.531, "r_y3": 263.688, "coord_origin": "TOPLEFT"}, "text": "\u7b2c", "orig": "\u7b2c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 93, "label": "text", "bbox": {"l": 60.177, "t": 264.35699999999997, "r": 65.344, "b": 268.644, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 60.177, "r_y0": 268.644, "r_x1": 65.344, "r_y1": 268.644, "r_x2": 65.344, "r_y2": 264.35699999999997, "r_x3": 60.177, "r_y3": 264.35699999999997, "coord_origin": "TOPLEFT"}, "text": "17", "orig": "17", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 94, "label": "text", "bbox": {"l": 65.344, "t": 263.688, "r": 90.902, "b": 268.33399999999995, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 65.344, "r_y0": 268.33399999999995, "r_x1": 90.902, "r_y1": 268.33399999999995, "r_x2": 90.902, "r_y2": 263.688, "r_x3": 65.344, "r_y3": 263.688, "coord_origin": "TOPLEFT"}, "text": "\u56de\u4eba\u5de5\u77e5\u80fd\u5b66\u4f1a\u5168\u56fd\u5927\u4f1a", "orig": "\u56de\u4eba\u5de5\u77e5\u80fd\u5b66\u4f1a\u5168\u56fd\u5927\u4f1a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 95, "label": "text", "bbox": {"l": 116.451, "t": 264.35699999999997, "r": 129.882, "b": 268.644, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 116.451, "r_y0": 268.644, "r_x1": 129.882, "r_y1": 268.644, "r_x2": 129.882, "r_y2": 264.35699999999997, "r_x3": 116.451, "r_y3": 264.35699999999997, "coord_origin": "TOPLEFT"}, "text": "(2003)", "orig": "(2003)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 96, "label": "text", "bbox": {"l": 183.105, "t": 263.58299999999997, "r": 190.857, "b": 267.869, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.105, "r_y0": 267.869, "r_x1": 190.857, "r_y1": 267.869, "r_x2": 190.857, "r_y2": 263.58299999999997, "r_x3": 183.105, "r_y3": 263.58299999999997, "coord_origin": "TOPLEFT"}, "text": "208", "orig": "208", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 97, "label": "text", "bbox": {"l": 210.282, "t": 263.58299999999997, "r": 212.865, "b": 267.869, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 210.282, "r_y0": 267.869, "r_x1": 212.865, "r_y1": 267.869, "r_x2": 212.865, "r_y2": 263.58299999999997, "r_x3": 210.282, "r_y3": 263.58299999999997, "coord_origin": "TOPLEFT"}, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 98, "label": "text", "bbox": {"l": 232.292, "t": 263.58299999999997, "r": 240.043, "b": 267.869, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 232.292, "r_y0": 267.869, "r_x1": 240.043, "r_y1": 267.869, "r_x2": 240.043, "r_y2": 263.58299999999997, "r_x3": 232.292, "r_y3": 263.58299999999997, "coord_origin": "TOPLEFT"}, "text": "203", "orig": "203", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 99, "label": "text", "bbox": {"l": 256.884, "t": 263.58299999999997, "r": 264.636, "b": 267.869, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 48, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 256.884, "r_y0": 267.869, "r_x1": 264.636, "r_y1": 267.869, "r_x2": 264.636, "r_y2": 263.58299999999997, "r_x3": 256.884, "r_y3": 263.58299999999997, "coord_origin": "TOPLEFT"}, "text": "152", "orig": "152", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 100, "label": "text", "bbox": {"l": 281.477, "t": 263.58299999999997, "r": 289.229, "b": 267.869, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 49, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 281.477, "r_y0": 267.869, "r_x1": 289.229, "r_y1": 267.869, "r_x2": 289.229, "r_y2": 263.58299999999997, "r_x3": 281.477, "r_y3": 263.58299999999997, "coord_origin": "TOPLEFT"}, "text": "244", "orig": "244", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 101, "label": "text", "bbox": {"l": 55.531, "t": 270.91600000000005, "r": 78.765, "b": 275.562, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 50, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 55.531, "r_y0": 275.562, "r_x1": 78.765, "r_y1": 275.562, "r_x2": 78.765, "r_y2": 270.91600000000005, "r_x3": 55.531, "r_y3": 270.91600000000005, "coord_origin": "TOPLEFT"}, "text": "\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u7814\u7a76\u4f1a\u7b2c", "orig": "\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u7814\u7a76\u4f1a\u7b2c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 102, "label": "text", "bbox": {"l": 101.99, "t": 271.58500000000004, "r": 109.742, "b": 275.871, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 51, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 101.99, "r_y0": 275.871, "r_x1": 109.742, "r_y1": 275.871, "r_x2": 109.742, "r_y2": 271.58500000000004, "r_x3": 101.99, "r_y3": 271.58500000000004, "coord_origin": "TOPLEFT"}, "text": "146", "orig": "146", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 103, "label": "text", "bbox": {"l": 109.742, "t": 270.91600000000005, "r": 112.065, "b": 275.562, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 52, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 109.742, "r_y0": 275.562, "r_x1": 112.065, "r_y1": 275.562, "r_x2": 112.065, "r_y2": 270.91600000000005, "r_x3": 109.742, "r_y3": 270.91600000000005, "coord_origin": "TOPLEFT"}, "text": "\u301c", "orig": "\u301c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 104, "label": "text", "bbox": {"l": 114.388, "t": 271.58500000000004, "r": 122.139, "b": 275.871, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 53, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 114.388, "r_y0": 275.871, "r_x1": 122.139, "r_y1": 275.871, "r_x2": 122.139, "r_y2": 271.58500000000004, "r_x3": 114.388, "r_y3": 271.58500000000004, "coord_origin": "TOPLEFT"}, "text": "155", "orig": "155", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 105, "label": "text", "bbox": {"l": 122.14, "t": 270.91600000000005, "r": 124.463, "b": 275.562, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 54, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 122.14, "r_y0": 275.562, "r_x1": 124.463, "r_y1": 275.562, "r_x2": 124.463, "r_y2": 270.91600000000005, "r_x3": 122.14, "r_y3": 270.91600000000005, "coord_origin": "TOPLEFT"}, "text": "\u56de", "orig": "\u56de", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 106, "label": "text", "bbox": {"l": 184.397, "t": 270.80999999999995, "r": 189.565, "b": 275.096, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 55, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 184.397, "r_y0": 275.096, "r_x1": 189.565, "r_y1": 275.096, "r_x2": 189.565, "r_y2": 270.80999999999995, "r_x3": 184.397, "r_y3": 270.80999999999995, "coord_origin": "TOPLEFT"}, "text": "98", "orig": "98", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 107, "label": "text", "bbox": {"l": 210.282, "t": 270.80999999999995, "r": 212.865, "b": 275.096, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 56, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 210.282, "r_y0": 275.096, "r_x1": 212.865, "r_y1": 275.096, "r_x2": 212.865, "r_y2": 270.80999999999995, "r_x3": 210.282, "r_y3": 270.80999999999995, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 108, "label": "text", "bbox": {"l": 233.583, "t": 270.80999999999995, "r": 238.751, "b": 275.096, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 57, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 233.583, "r_y0": 275.096, "r_x1": 238.751, "r_y1": 275.096, "r_x2": 238.751, "r_y2": 270.80999999999995, "r_x3": 233.583, "r_y3": 270.80999999999995, "coord_origin": "TOPLEFT"}, "text": "96", "orig": "96", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 109, "label": "text", "bbox": {"l": 256.884, "t": 270.80999999999995, "r": 264.636, "b": 275.096, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 58, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 256.884, "r_y0": 275.096, "r_x1": 264.636, "r_y1": 275.096, "r_x2": 264.636, "r_y2": 270.80999999999995, "r_x3": 256.884, "r_y3": 270.80999999999995, "coord_origin": "TOPLEFT"}, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 110, "label": "text", "bbox": {"l": 281.477, "t": 270.80999999999995, "r": 289.229, "b": 275.096, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 59, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 281.477, "r_y0": 275.096, "r_x1": 289.229, "r_y1": 275.096, "r_x2": 289.229, "r_y2": 270.80999999999995, "r_x3": 281.477, "r_y3": 270.80999999999995, "coord_origin": "TOPLEFT"}, "text": "232", "orig": "232", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 111, "label": "text", "bbox": {"l": 55.531, "t": 279.07000000000005, "r": 68.686, "b": 283.356, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 60, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 55.531, "r_y0": 283.356, "r_x1": 68.686, "r_y1": 283.356, "r_x2": 68.686, "r_y2": 279.07000000000005, "r_x3": 55.531, "r_y3": 279.07000000000005, "coord_origin": "TOPLEFT"}, "text": "WWW", "orig": "WWW", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 112, "label": "text", "bbox": {"l": 68.686, "t": 278.40099999999995, "r": 87.273, "b": 283.047, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 61, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 68.686, "r_y0": 283.047, "r_x1": 87.273, "r_y1": 283.047, "r_x2": 87.273, "r_y2": 278.40099999999995, "r_x3": 68.686, "r_y3": 278.40099999999995, "coord_origin": "TOPLEFT"}, "text": "\u304b\u3089\u53ce\u96c6\u3057\u305f\u8ad6\u6587", "orig": "\u304b\u3089\u53ce\u96c6\u3057\u305f\u8ad6\u6587", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 113, "label": "text", "bbox": {"l": 183.105, "t": 278.03700000000003, "r": 190.857, "b": 282.323, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 62, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.105, "r_y0": 282.323, "r_x1": 190.857, "r_y1": 282.323, "r_x2": 190.857, "r_y2": 278.03700000000003, "r_x3": 183.105, "r_y3": 278.03700000000003, "coord_origin": "TOPLEFT"}, "text": "107", "orig": "107", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 114, "label": "text", "bbox": {"l": 208.99, "t": 278.03700000000003, "r": 214.158, "b": 282.323, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 63, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 208.99, "r_y0": 282.323, "r_x1": 214.158, "r_y1": 282.323, "r_x2": 214.158, "r_y2": 278.03700000000003, "r_x3": 208.99, "r_y3": 278.03700000000003, "coord_origin": "TOPLEFT"}, "text": "73", "orig": "73", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 115, "label": "text", "bbox": {"l": 233.583, "t": 278.03700000000003, "r": 238.751, "b": 282.323, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 64, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 233.583, "r_y0": 282.323, "r_x1": 238.751, "r_y1": 282.323, "r_x2": 238.751, "r_y2": 278.03700000000003, "r_x3": 233.583, "r_y3": 278.03700000000003, "coord_origin": "TOPLEFT"}, "text": "34", "orig": "34", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 116, "label": "text", "bbox": {"l": 256.884, "t": 278.03700000000003, "r": 264.636, "b": 282.323, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 65, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 256.884, "r_y0": 282.323, "r_x1": 264.636, "r_y1": 282.323, "r_x2": 264.636, "r_y2": 278.03700000000003, "r_x3": 256.884, "r_y3": 278.03700000000003, "coord_origin": "TOPLEFT"}, "text": "147", "orig": "147", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 117, "label": "text", "bbox": {"l": 282.769, "t": 278.03700000000003, "r": 287.937, "b": 282.323, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 66, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 282.769, "r_y0": 282.323, "r_x1": 287.937, "r_y1": 282.323, "r_x2": 287.937, "r_y2": 278.03700000000003, "r_x3": 282.769, "r_y3": 278.03700000000003, "coord_origin": "TOPLEFT"}, "text": "96", "orig": "96", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 118, "label": "text", "bbox": {"l": 169.615, "t": 285.628, "r": 171.938, "b": 290.274, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 67, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 169.615, "r_y0": 290.274, "r_x1": 171.938, "r_y1": 290.274, "r_x2": 171.938, "r_y2": 285.628, "r_x3": 169.615, "r_y3": 285.628, "coord_origin": "TOPLEFT"}, "text": "\u8a08", "orig": "\u8a08", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 119, "label": "text", "bbox": {"l": 183.105, "t": 285.522, "r": 190.857, "b": 289.809, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 68, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.105, "r_y0": 289.809, "r_x1": 190.857, "r_y1": 289.809, "r_x2": 190.857, "r_y2": 285.522, "r_x3": 183.105, "r_y3": 285.522, "coord_origin": "TOPLEFT"}, "text": "945", "orig": "945", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 120, "label": "text", "bbox": {"l": 207.698, "t": 285.522, "r": 215.45, "b": 289.809, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 69, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 207.698, "r_y0": 289.809, "r_x1": 215.45, "r_y1": 289.809, "r_x2": 215.45, "r_y2": 285.522, "r_x3": 207.698, "r_y3": 285.522, "coord_origin": "TOPLEFT"}, "text": "294", "orig": "294", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 121, "label": "text", "bbox": {"l": 232.292, "t": 285.522, "r": 240.043, "b": 289.809, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 70, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 232.292, "r_y0": 289.809, "r_x1": 240.043, "r_y1": 289.809, "r_x2": 240.043, "r_y2": 285.522, "r_x3": 232.292, "r_y3": 285.522, "coord_origin": "TOPLEFT"}, "text": "651", "orig": "651", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 122, "label": "text", "bbox": {"l": 255.765, "t": 285.522, "r": 265.752, "b": 289.809, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 71, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 255.765, "r_y0": 289.809, "r_x1": 265.752, "r_y1": 289.809, "r_x2": 265.752, "r_y2": 285.522, "r_x3": 255.765, "r_y3": 285.522, "coord_origin": "TOPLEFT"}, "text": "1122", "orig": "1122", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 123, "label": "text", "bbox": {"l": 281.477, "t": 285.522, "r": 289.229, "b": 289.809, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 72, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 281.477, "r_y0": 289.809, "r_x1": 289.229, "r_y1": 289.809, "r_x2": 289.229, "r_y2": 285.522, "r_x3": 281.477, "r_y3": 285.522, "coord_origin": "TOPLEFT"}, "text": "955", "orig": "955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}]}, "text": null, "otsl_seq": ["ched", "ched", "ched", "lcel", "ched", "lcel", "nl", "ched", "ched", "ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 10, "num_cols": 6, "table_cells": [{"bbox": {"l": 209.933, "t": 221.35799999999995, "r": 223.873, "b": 226.00400000000002, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 2, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 2, "end_col_offset_idx": 4, "text": "\u8ad6\u6587\u30d5\u30a1\u30a4\u30eb", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 263.765, "t": 221.35799999999995, "r": 273.058, "b": 226.00400000000002, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 2, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 4, "end_col_offset_idx": 6, "text": "\u53c2\u8003\u6587\u732e", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 110.25, "t": 228.84400000000005, "r": 114.896, "b": 233.49, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "\u51fa\u5178", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 175.366, "t": 228.84400000000005, "r": 199.961, "b": 233.49, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "\u30d5\u30a1\u30a4\u30eb\u6570 \u82f1\u8a9e", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 229.198, "t": 228.84400000000005, "r": 236.168, "b": 233.49, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "\u65e5\u672c\u8a9e", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 256.114, "t": 228.84400000000005, "r": 260.761, "b": 233.49, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "\u82f1\u8a9e", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 278.384, "t": 228.84400000000005, "r": 285.354, "b": 233.49, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "\u65e5\u672c\u8a9e", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 55.531, "t": 236.48199999999997, "r": 162.713, "b": 240.76800000000003, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Association for Computational Linguistics(ACL2003)", "column_header": false, "row_header": true, "row_section": false}, {"bbox": {"l": 184.397, "t": 236.48199999999997, "r": 189.565, "b": 240.76800000000003, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "65", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 208.99, "t": 236.48199999999997, "r": 214.158, "b": 240.76800000000003, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "65", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 234.875, "t": 236.48199999999997, "r": 237.458, "b": 240.76800000000003, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "0", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 256.884, "t": 236.48199999999997, "r": 264.636, "b": 240.76800000000003, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "150", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 284.061, "t": 236.48199999999997, "r": 286.644, "b": 240.76800000000003, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "0", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 55.531, "t": 242.67600000000004, "r": 139.722, "b": 246.962, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Computational Linguistics(COLING2002)", "column_header": false, "row_header": true, "row_section": false}, {"bbox": {"l": 183.105, "t": 242.67600000000004, "r": 190.857, "b": 246.962, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "140", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 207.698, "t": 242.67600000000004, "r": 215.45, "b": 246.962, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "140", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 234.875, "t": 242.67600000000004, "r": 237.458, "b": 246.962, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "0", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 256.884, "t": 242.67600000000004, "r": 264.636, "b": 246.962, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "150", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 284.061, "t": 242.67600000000004, "r": 286.644, "b": 246.962, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "0", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 55.531, "t": 248.976, "r": 114.651, "b": 253.93100000000004, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "\u96fb\u6c17\u60c5\u5831\u901a\u4fe1\u5b66\u4f1a 2003 \u5e74\u7dcf\u5408\u5927\u4f1a", "column_header": false, "row_header": true, "row_section": false}, {"bbox": {"l": 183.105, "t": 248.87099999999998, "r": 190.857, "b": 253.15700000000004, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "150", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 210.282, "t": 248.87099999999998, "r": 212.865, "b": 253.15700000000004, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "8", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 232.292, "t": 248.87099999999998, "r": 240.043, "b": 253.15700000000004, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "142", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 256.884, "t": 248.87099999999998, "r": 264.636, "b": 253.15700000000004, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "223", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 281.477, "t": 248.87099999999998, "r": 289.229, "b": 253.15700000000004, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "147", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 55.531, "t": 256.461, "r": 129.882, "b": 261.41600000000005, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "\u60c5\u5831\u51e6\u7406\u5b66\u4f1a\u7b2c 65 \u56de\u5168\u56fd\u5927\u4f1a (2003)", "column_header": false, "row_header": true, "row_section": false}, {"bbox": {"l": 183.105, "t": 256.356, "r": 190.857, "b": 260.64200000000005, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "177", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 210.282, "t": 256.356, "r": 212.865, "b": 260.64200000000005, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "1", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 232.292, "t": 256.356, "r": 240.043, "b": 260.64200000000005, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "176", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 256.884, "t": 256.356, "r": 264.636, "b": 260.64200000000005, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "150", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 281.477, "t": 256.356, "r": 289.229, "b": 260.64200000000005, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "236", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 55.531, "t": 263.688, "r": 129.882, "b": 268.644, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "\u7b2c 17 \u56de\u4eba\u5de5\u77e5\u80fd\u5b66\u4f1a\u5168\u56fd\u5927\u4f1a (2003)", "column_header": false, "row_header": true, "row_section": false}, {"bbox": {"l": 183.105, "t": 263.58299999999997, "r": 190.857, "b": 267.869, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "208", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 210.282, "t": 263.58299999999997, "r": 212.865, "b": 267.869, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "5", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 232.292, "t": 263.58299999999997, "r": 240.043, "b": 267.869, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "203", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 256.884, "t": 263.58299999999997, "r": 264.636, "b": 267.869, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "152", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 281.477, "t": 263.58299999999997, "r": 289.229, "b": 267.869, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "244", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 55.531, "t": 270.91600000000005, "r": 124.463, "b": 275.871, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 7, "end_row_offset_idx": 8, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u7814\u7a76\u4f1a\u7b2c 146 \u301c 155 \u56de", "column_header": false, "row_header": true, "row_section": false}, {"bbox": {"l": 184.397, "t": 270.80999999999995, "r": 189.565, "b": 275.096, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 7, "end_row_offset_idx": 8, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "98", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 210.282, "t": 270.80999999999995, "r": 212.865, "b": 275.096, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 7, "end_row_offset_idx": 8, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "2", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 233.583, "t": 270.80999999999995, "r": 238.751, "b": 275.096, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 7, "end_row_offset_idx": 8, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "96", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 256.884, "t": 270.80999999999995, "r": 264.636, "b": 275.096, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 7, "end_row_offset_idx": 8, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "150", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 281.477, "t": 270.80999999999995, "r": 289.229, "b": 275.096, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 7, "end_row_offset_idx": 8, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "232", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 55.531, "t": 278.40099999999995, "r": 87.273, "b": 283.356, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 8, "end_row_offset_idx": 9, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "WWW \u304b\u3089\u53ce\u96c6\u3057\u305f\u8ad6\u6587", "column_header": false, "row_header": true, "row_section": false}, {"bbox": {"l": 183.105, "t": 278.03700000000003, "r": 190.857, "b": 282.323, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 8, "end_row_offset_idx": 9, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "107", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 208.99, "t": 278.03700000000003, "r": 214.158, "b": 282.323, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 8, "end_row_offset_idx": 9, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "73", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 233.583, "t": 278.03700000000003, "r": 238.751, "b": 282.323, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 8, "end_row_offset_idx": 9, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "34", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 256.884, "t": 278.03700000000003, "r": 264.636, "b": 282.323, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 8, "end_row_offset_idx": 9, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "147", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 282.769, "t": 278.03700000000003, "r": 287.937, "b": 282.323, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 8, "end_row_offset_idx": 9, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "96", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 169.615, "t": 285.628, "r": 171.938, "b": 290.274, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 9, "end_row_offset_idx": 10, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "\u8a08", "column_header": false, "row_header": true, "row_section": false}, {"bbox": {"l": 183.105, "t": 285.522, "r": 190.857, "b": 289.809, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 9, "end_row_offset_idx": 10, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "945", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 207.698, "t": 285.522, "r": 215.45, "b": 289.809, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 9, "end_row_offset_idx": 10, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "294", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 232.292, "t": 285.522, "r": 240.043, "b": 289.809, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 9, "end_row_offset_idx": 10, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "651", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 255.765, "t": 285.522, "r": 265.752, "b": 289.809, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 9, "end_row_offset_idx": 10, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "1122", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 281.477, "t": 285.522, "r": 289.229, "b": 289.809, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 9, "end_row_offset_idx": 10, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "955", "column_header": false, "row_header": false, "row_section": false}]}, "7": {"label": "table", "id": 7, "page_no": 7, "cluster": {"id": 7, "label": "table", "bbox": {"l": 304.9219970703125, "t": 218.51486206054688, "r": 550.2321166992188, "b": 287.90069580078125, "coord_origin": "TOPLEFT"}, "confidence": 0.8899767994880676, "cells": [{"index": 74, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 459.049, "r_y0": 226.67100000000005, "r_x1": 542.0, "r_y1": 226.67100000000005, "r_x2": 542.0, "r_y2": 221.68899999999996, "r_x3": 459.049, "r_y3": 221.68899999999996, "coord_origin": "TOPLEFT"}, "text": "Weighted Average Grant Date Fair", "orig": "Weighted Average Grant Date Fair", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 75, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 493.822, "r_y0": 232.88099999999997, "r_x1": 507.226, "r_y1": 232.88099999999997, "r_x2": 507.226, "r_y2": 227.899, "r_x3": 493.822, "r_y3": 227.899, "coord_origin": "TOPLEFT"}, "text": "Value", "orig": "Value", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 76, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 393.244, "r_y0": 241.79399999999998, "r_x1": 407.346, "r_y1": 241.79399999999998, "r_x2": 407.346, "r_y2": 236.812, "r_x3": 393.244, "r_y3": 236.812, "coord_origin": "TOPLEFT"}, "text": "RSUs", "orig": "RSUs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 77, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 392.097, "r_y0": 226.62099999999998, "r_x1": 438.015, "r_y1": 226.62099999999998, "r_x2": 438.015, "r_y2": 221.639, "r_x3": 392.097, "r_y3": 221.639, "coord_origin": "TOPLEFT"}, "text": "Shares (in millions)", "orig": "Shares (in millions)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 78, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 427.183, "r_y0": 241.79399999999998, "r_x1": 440.988, "r_y1": 241.79399999999998, "r_x2": 440.988, "r_y2": 236.812, "r_x3": 427.183, "r_y3": 236.812, "coord_origin": "TOPLEFT"}, "text": "PSUs", "orig": "PSUs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 79, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 468.383, "r_y0": 241.79399999999998, "r_x1": 482.485, "r_y1": 241.79399999999998, "r_x2": 482.485, "r_y2": 236.812, "r_x3": 468.383, "r_y3": 236.812, "coord_origin": "TOPLEFT"}, "text": "RSUs", "orig": "RSUs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 80, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 516.926, "r_y0": 241.79399999999998, "r_x1": 530.73, "r_y1": 241.79399999999998, "r_x2": 530.73, "r_y2": 236.812, "r_x3": 516.926, "r_y3": 236.812, "coord_origin": "TOPLEFT"}, "text": "PSUs", "orig": "PSUs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 81, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 306.115, "r_y0": 249.65700000000004, "r_x1": 364.656, "r_y1": 249.65700000000004, "r_x2": 364.656, "r_y2": 244.67600000000004, "r_x3": 306.115, "r_y3": 244.67600000000004, "coord_origin": "TOPLEFT"}, "text": "Nonvested on January 1", "orig": "Nonvested on January 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 82, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 396.247, "r_y0": 249.96000000000004, "r_x1": 403.755, "r_y1": 249.96000000000004, "r_x2": 403.755, "r_y2": 244.97799999999995, "r_x3": 396.247, "r_y3": 244.97799999999995, "coord_origin": "TOPLEFT"}, "text": "1.1", "orig": "1.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 83, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 429.818, "r_y0": 249.96000000000004, "r_x1": 437.327, "r_y1": 249.96000000000004, "r_x2": 437.327, "r_y2": 244.97799999999995, "r_x3": 429.818, "r_y3": 244.97799999999995, "coord_origin": "TOPLEFT"}, "text": "0.3", "orig": "0.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 84, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 465.529, "r_y0": 249.96000000000004, "r_x1": 483.55, "r_y1": 249.96000000000004, "r_x2": 483.55, "r_y2": 244.97799999999995, "r_x3": 465.529, "r_y3": 244.97799999999995, "coord_origin": "TOPLEFT"}, "text": "90.10 $", "orig": "90.10 $", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 85, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 513.448, "r_y0": 249.96000000000004, "r_x1": 531.47, "r_y1": 249.96000000000004, "r_x2": 531.47, "r_y2": 244.97799999999995, "r_x3": 513.448, "r_y3": 244.97799999999995, "coord_origin": "TOPLEFT"}, "text": "$ 91.19", "orig": "$ 91.19", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 86, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 306.115, "r_y0": 258.731, "r_x1": 325.627, "r_y1": 258.731, "r_x2": 325.627, "r_y2": 253.74900000000002, "r_x3": 306.115, "r_y3": 253.74900000000002, "coord_origin": "TOPLEFT"}, "text": "Granted", "orig": "Granted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 87, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 396.247, "r_y0": 258.731, "r_x1": 403.755, "r_y1": 258.731, "r_x2": 403.755, "r_y2": 253.74900000000002, "r_x3": 396.247, "r_y3": 253.74900000000002, "coord_origin": "TOPLEFT"}, "text": "0.5", "orig": "0.5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 88, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 429.818, "r_y0": 258.731, "r_x1": 437.327, "r_y1": 258.731, "r_x2": 437.327, "r_y2": 253.74900000000002, "r_x3": 429.818, "r_y3": 253.74900000000002, "coord_origin": "TOPLEFT"}, "text": "0.1", "orig": "0.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 89, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 466.436, "r_y0": 258.731, "r_x1": 482.548, "r_y1": 258.731, "r_x2": 482.548, "r_y2": 253.74900000000002, "r_x3": 466.436, "r_y3": 253.74900000000002, "coord_origin": "TOPLEFT"}, "text": "117.44", "orig": "117.44", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 90, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 514.291, "r_y0": 258.731, "r_x1": 530.81, "r_y1": 258.731, "r_x2": 530.81, "r_y2": 253.74900000000002, "r_x3": 514.291, "r_y3": 253.74900000000002, "coord_origin": "TOPLEFT"}, "text": "122.41", "orig": "122.41", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 91, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 306.115, "r_y0": 266.595, "r_x1": 322.629, "r_y1": 266.595, "r_x2": 322.629, "r_y2": 261.61300000000006, "r_x3": 306.115, "r_y3": 261.61300000000006, "coord_origin": "TOPLEFT"}, "text": "Vested", "orig": "Vested", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 92, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.432, "r_y0": 266.595, "r_x1": 405.536, "r_y1": 266.595, "r_x2": 405.536, "r_y2": 261.61300000000006, "r_x3": 394.432, "r_y3": 261.61300000000006, "coord_origin": "TOPLEFT"}, "text": "(0.5)", "orig": "(0.5)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 93, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 427.702, "r_y0": 266.595, "r_x1": 438.806, "r_y1": 266.595, "r_x2": 438.806, "r_y2": 261.61300000000006, "r_x3": 427.702, "r_y3": 261.61300000000006, "coord_origin": "TOPLEFT"}, "text": "(0.1)", "orig": "(0.1)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 94, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 468.555, "r_y0": 266.595, "r_x1": 482.07, "r_y1": 266.595, "r_x2": 482.07, "r_y2": 261.61300000000006, "r_x3": 468.555, "r_y3": 261.61300000000006, "coord_origin": "TOPLEFT"}, "text": "87.08", "orig": "87.08", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 95, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 516.019, "r_y0": 266.595, "r_x1": 529.534, "r_y1": 266.595, "r_x2": 529.534, "r_y2": 261.61300000000006, "r_x3": 516.019, "r_y3": 261.61300000000006, "coord_origin": "TOPLEFT"}, "text": "81.14", "orig": "81.14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 96, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 306.115, "r_y0": 274.688, "r_x1": 356.248, "r_y1": 274.688, "r_x2": 356.248, "r_y2": 269.706, "r_x3": 306.115, "r_y3": 269.706, "coord_origin": "TOPLEFT"}, "text": "Canceled or forfeited", "orig": "Canceled or forfeited", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 97, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.432, "r_y0": 275.366, "r_x1": 405.536, "r_y1": 275.366, "r_x2": 405.536, "r_y2": 270.384, "r_x3": 394.432, "r_y3": 270.384, "coord_origin": "TOPLEFT"}, "text": "(0.1)", "orig": "(0.1)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 98, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 431.028, "r_y0": 275.366, "r_x1": 436.428, "r_y1": 275.366, "r_x2": 436.428, "r_y2": 270.384, "r_x3": 431.028, "r_y3": 270.384, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 99, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 465.831, "r_y0": 275.366, "r_x1": 482.35, "r_y1": 275.366, "r_x2": 482.35, "r_y2": 270.384, "r_x3": 465.831, "r_y3": 270.384, "coord_origin": "TOPLEFT"}, "text": "102.01", "orig": "102.01", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 100, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 516.019, "r_y0": 275.366, "r_x1": 529.534, "r_y1": 275.366, "r_x2": 529.534, "r_y2": 270.384, "r_x3": 516.019, "r_y3": 270.384, "coord_origin": "TOPLEFT"}, "text": "92.18", "orig": "92.18", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 101, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 306.115, "r_y0": 283.532, "r_x1": 373.358, "r_y1": 283.532, "r_x2": 373.358, "r_y2": 278.55100000000004, "r_x3": 306.115, "r_y3": 278.55100000000004, "coord_origin": "TOPLEFT"}, "text": "Nonvested on December 31", "orig": "Nonvested on December 31", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 102, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 396.247, "r_y0": 283.532, "r_x1": 403.755, "r_y1": 283.532, "r_x2": 403.755, "r_y2": 278.55100000000004, "r_x3": 396.247, "r_y3": 278.55100000000004, "coord_origin": "TOPLEFT"}, "text": "1.0", "orig": "1.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 103, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 429.516, "r_y0": 283.532, "r_x1": 437.025, "r_y1": 283.532, "r_x2": 437.025, "r_y2": 278.55100000000004, "r_x3": 429.516, "r_y3": 278.55100000000004, "coord_origin": "TOPLEFT"}, "text": "0.3", "orig": "0.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 104, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 463.714, "r_y0": 283.532, "r_x1": 484.74, "r_y1": 283.532, "r_x2": 484.74, "r_y2": 278.55100000000004, "r_x3": 463.714, "r_y3": 278.55100000000004, "coord_origin": "TOPLEFT"}, "text": "104.85 $", "orig": "104.85 $", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 105, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 512.995, "r_y0": 283.532, "r_x1": 534.02, "r_y1": 283.532, "r_x2": 534.02, "r_y2": 278.55100000000004, "r_x3": 512.995, "r_y3": 278.55100000000004, "coord_origin": "TOPLEFT"}, "text": "$ 104.51", "orig": "$ 104.51", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": [{"id": 124, "label": "text", "bbox": {"l": 459.049, "t": 221.68899999999996, "r": 542.0, "b": 226.67100000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 74, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 459.049, "r_y0": 226.67100000000005, "r_x1": 542.0, "r_y1": 226.67100000000005, "r_x2": 542.0, "r_y2": 221.68899999999996, "r_x3": 459.049, "r_y3": 221.68899999999996, "coord_origin": "TOPLEFT"}, "text": "Weighted Average Grant Date Fair", "orig": "Weighted Average Grant Date Fair", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 125, "label": "text", "bbox": {"l": 493.822, "t": 227.899, "r": 507.226, "b": 232.88099999999997, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 75, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 493.822, "r_y0": 232.88099999999997, "r_x1": 507.226, "r_y1": 232.88099999999997, "r_x2": 507.226, "r_y2": 227.899, "r_x3": 493.822, "r_y3": 227.899, "coord_origin": "TOPLEFT"}, "text": "Value", "orig": "Value", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 126, "label": "text", "bbox": {"l": 393.244, "t": 236.812, "r": 407.346, "b": 241.79399999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 76, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 393.244, "r_y0": 241.79399999999998, "r_x1": 407.346, "r_y1": 241.79399999999998, "r_x2": 407.346, "r_y2": 236.812, "r_x3": 393.244, "r_y3": 236.812, "coord_origin": "TOPLEFT"}, "text": "RSUs", "orig": "RSUs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 127, "label": "text", "bbox": {"l": 392.097, "t": 221.639, "r": 438.015, "b": 226.62099999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 77, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 392.097, "r_y0": 226.62099999999998, "r_x1": 438.015, "r_y1": 226.62099999999998, "r_x2": 438.015, "r_y2": 221.639, "r_x3": 392.097, "r_y3": 221.639, "coord_origin": "TOPLEFT"}, "text": "Shares (in millions)", "orig": "Shares (in millions)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 128, "label": "text", "bbox": {"l": 427.183, "t": 236.812, "r": 440.988, "b": 241.79399999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 78, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 427.183, "r_y0": 241.79399999999998, "r_x1": 440.988, "r_y1": 241.79399999999998, "r_x2": 440.988, "r_y2": 236.812, "r_x3": 427.183, "r_y3": 236.812, "coord_origin": "TOPLEFT"}, "text": "PSUs", "orig": "PSUs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 129, "label": "text", "bbox": {"l": 468.383, "t": 236.812, "r": 482.485, "b": 241.79399999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 79, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 468.383, "r_y0": 241.79399999999998, "r_x1": 482.485, "r_y1": 241.79399999999998, "r_x2": 482.485, "r_y2": 236.812, "r_x3": 468.383, "r_y3": 236.812, "coord_origin": "TOPLEFT"}, "text": "RSUs", "orig": "RSUs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 130, "label": "text", "bbox": {"l": 516.926, "t": 236.812, "r": 530.73, "b": 241.79399999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 80, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 516.926, "r_y0": 241.79399999999998, "r_x1": 530.73, "r_y1": 241.79399999999998, "r_x2": 530.73, "r_y2": 236.812, "r_x3": 516.926, "r_y3": 236.812, "coord_origin": "TOPLEFT"}, "text": "PSUs", "orig": "PSUs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 131, "label": "text", "bbox": {"l": 306.115, "t": 244.67600000000004, "r": 364.656, "b": 249.65700000000004, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 81, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 306.115, "r_y0": 249.65700000000004, "r_x1": 364.656, "r_y1": 249.65700000000004, "r_x2": 364.656, "r_y2": 244.67600000000004, "r_x3": 306.115, "r_y3": 244.67600000000004, "coord_origin": "TOPLEFT"}, "text": "Nonvested on January 1", "orig": "Nonvested on January 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 132, "label": "text", "bbox": {"l": 396.247, "t": 244.97799999999995, "r": 403.755, "b": 249.96000000000004, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 82, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 396.247, "r_y0": 249.96000000000004, "r_x1": 403.755, "r_y1": 249.96000000000004, "r_x2": 403.755, "r_y2": 244.97799999999995, "r_x3": 396.247, "r_y3": 244.97799999999995, "coord_origin": "TOPLEFT"}, "text": "1.1", "orig": "1.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 133, "label": "text", "bbox": {"l": 429.818, "t": 244.97799999999995, "r": 437.327, "b": 249.96000000000004, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 83, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 429.818, "r_y0": 249.96000000000004, "r_x1": 437.327, "r_y1": 249.96000000000004, "r_x2": 437.327, "r_y2": 244.97799999999995, "r_x3": 429.818, "r_y3": 244.97799999999995, "coord_origin": "TOPLEFT"}, "text": "0.3", "orig": "0.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 134, "label": "text", "bbox": {"l": 465.529, "t": 244.97799999999995, "r": 483.55, "b": 249.96000000000004, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 84, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 465.529, "r_y0": 249.96000000000004, "r_x1": 483.55, "r_y1": 249.96000000000004, "r_x2": 483.55, "r_y2": 244.97799999999995, "r_x3": 465.529, "r_y3": 244.97799999999995, "coord_origin": "TOPLEFT"}, "text": "90.10 $", "orig": "90.10 $", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 135, "label": "text", "bbox": {"l": 513.448, "t": 244.97799999999995, "r": 531.47, "b": 249.96000000000004, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 85, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 513.448, "r_y0": 249.96000000000004, "r_x1": 531.47, "r_y1": 249.96000000000004, "r_x2": 531.47, "r_y2": 244.97799999999995, "r_x3": 513.448, "r_y3": 244.97799999999995, "coord_origin": "TOPLEFT"}, "text": "$ 91.19", "orig": "$ 91.19", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 136, "label": "text", "bbox": {"l": 306.115, "t": 253.74900000000002, "r": 325.627, "b": 258.731, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 86, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 306.115, "r_y0": 258.731, "r_x1": 325.627, "r_y1": 258.731, "r_x2": 325.627, "r_y2": 253.74900000000002, "r_x3": 306.115, "r_y3": 253.74900000000002, "coord_origin": "TOPLEFT"}, "text": "Granted", "orig": "Granted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 137, "label": "text", "bbox": {"l": 396.247, "t": 253.74900000000002, "r": 403.755, "b": 258.731, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 87, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 396.247, "r_y0": 258.731, "r_x1": 403.755, "r_y1": 258.731, "r_x2": 403.755, "r_y2": 253.74900000000002, "r_x3": 396.247, "r_y3": 253.74900000000002, "coord_origin": "TOPLEFT"}, "text": "0.5", "orig": "0.5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 138, "label": "text", "bbox": {"l": 429.818, "t": 253.74900000000002, "r": 437.327, "b": 258.731, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 88, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 429.818, "r_y0": 258.731, "r_x1": 437.327, "r_y1": 258.731, "r_x2": 437.327, "r_y2": 253.74900000000002, "r_x3": 429.818, "r_y3": 253.74900000000002, "coord_origin": "TOPLEFT"}, "text": "0.1", "orig": "0.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 139, "label": "text", "bbox": {"l": 466.436, "t": 253.74900000000002, "r": 482.548, "b": 258.731, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 89, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 466.436, "r_y0": 258.731, "r_x1": 482.548, "r_y1": 258.731, "r_x2": 482.548, "r_y2": 253.74900000000002, "r_x3": 466.436, "r_y3": 253.74900000000002, "coord_origin": "TOPLEFT"}, "text": "117.44", "orig": "117.44", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 140, "label": "text", "bbox": {"l": 514.291, "t": 253.74900000000002, "r": 530.81, "b": 258.731, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 90, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 514.291, "r_y0": 258.731, "r_x1": 530.81, "r_y1": 258.731, "r_x2": 530.81, "r_y2": 253.74900000000002, "r_x3": 514.291, "r_y3": 253.74900000000002, "coord_origin": "TOPLEFT"}, "text": "122.41", "orig": "122.41", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 141, "label": "text", "bbox": {"l": 306.115, "t": 261.61300000000006, "r": 322.629, "b": 266.595, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 91, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 306.115, "r_y0": 266.595, "r_x1": 322.629, "r_y1": 266.595, "r_x2": 322.629, "r_y2": 261.61300000000006, "r_x3": 306.115, "r_y3": 261.61300000000006, "coord_origin": "TOPLEFT"}, "text": "Vested", "orig": "Vested", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 142, "label": "text", "bbox": {"l": 394.432, "t": 261.61300000000006, "r": 405.536, "b": 266.595, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 92, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.432, "r_y0": 266.595, "r_x1": 405.536, "r_y1": 266.595, "r_x2": 405.536, "r_y2": 261.61300000000006, "r_x3": 394.432, "r_y3": 261.61300000000006, "coord_origin": "TOPLEFT"}, "text": "(0.5)", "orig": "(0.5)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 143, "label": "text", "bbox": {"l": 427.702, "t": 261.61300000000006, "r": 438.806, "b": 266.595, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 93, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 427.702, "r_y0": 266.595, "r_x1": 438.806, "r_y1": 266.595, "r_x2": 438.806, "r_y2": 261.61300000000006, "r_x3": 427.702, "r_y3": 261.61300000000006, "coord_origin": "TOPLEFT"}, "text": "(0.1)", "orig": "(0.1)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 144, "label": "text", "bbox": {"l": 468.555, "t": 261.61300000000006, "r": 482.07, "b": 266.595, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 94, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 468.555, "r_y0": 266.595, "r_x1": 482.07, "r_y1": 266.595, "r_x2": 482.07, "r_y2": 261.61300000000006, "r_x3": 468.555, "r_y3": 261.61300000000006, "coord_origin": "TOPLEFT"}, "text": "87.08", "orig": "87.08", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 145, "label": "text", "bbox": {"l": 516.019, "t": 261.61300000000006, "r": 529.534, "b": 266.595, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 95, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 516.019, "r_y0": 266.595, "r_x1": 529.534, "r_y1": 266.595, "r_x2": 529.534, "r_y2": 261.61300000000006, "r_x3": 516.019, "r_y3": 261.61300000000006, "coord_origin": "TOPLEFT"}, "text": "81.14", "orig": "81.14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 146, "label": "text", "bbox": {"l": 306.115, "t": 269.706, "r": 356.248, "b": 274.688, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 96, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 306.115, "r_y0": 274.688, "r_x1": 356.248, "r_y1": 274.688, "r_x2": 356.248, "r_y2": 269.706, "r_x3": 306.115, "r_y3": 269.706, "coord_origin": "TOPLEFT"}, "text": "Canceled or forfeited", "orig": "Canceled or forfeited", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 147, "label": "text", "bbox": {"l": 394.432, "t": 270.384, "r": 405.536, "b": 275.366, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 97, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.432, "r_y0": 275.366, "r_x1": 405.536, "r_y1": 275.366, "r_x2": 405.536, "r_y2": 270.384, "r_x3": 394.432, "r_y3": 270.384, "coord_origin": "TOPLEFT"}, "text": "(0.1)", "orig": "(0.1)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 148, "label": "text", "bbox": {"l": 431.028, "t": 270.384, "r": 436.428, "b": 275.366, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 98, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 431.028, "r_y0": 275.366, "r_x1": 436.428, "r_y1": 275.366, "r_x2": 436.428, "r_y2": 270.384, "r_x3": 431.028, "r_y3": 270.384, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 149, "label": "text", "bbox": {"l": 465.831, "t": 270.384, "r": 482.35, "b": 275.366, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 99, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 465.831, "r_y0": 275.366, "r_x1": 482.35, "r_y1": 275.366, "r_x2": 482.35, "r_y2": 270.384, "r_x3": 465.831, "r_y3": 270.384, "coord_origin": "TOPLEFT"}, "text": "102.01", "orig": "102.01", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 150, "label": "text", "bbox": {"l": 516.019, "t": 270.384, "r": 529.534, "b": 275.366, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 100, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 516.019, "r_y0": 275.366, "r_x1": 529.534, "r_y1": 275.366, "r_x2": 529.534, "r_y2": 270.384, "r_x3": 516.019, "r_y3": 270.384, "coord_origin": "TOPLEFT"}, "text": "92.18", "orig": "92.18", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 151, "label": "text", "bbox": {"l": 306.115, "t": 278.55100000000004, "r": 373.358, "b": 283.532, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 101, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 306.115, "r_y0": 283.532, "r_x1": 373.358, "r_y1": 283.532, "r_x2": 373.358, "r_y2": 278.55100000000004, "r_x3": 306.115, "r_y3": 278.55100000000004, "coord_origin": "TOPLEFT"}, "text": "Nonvested on December 31", "orig": "Nonvested on December 31", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 152, "label": "text", "bbox": {"l": 396.247, "t": 278.55100000000004, "r": 403.755, "b": 283.532, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 102, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 396.247, "r_y0": 283.532, "r_x1": 403.755, "r_y1": 283.532, "r_x2": 403.755, "r_y2": 278.55100000000004, "r_x3": 396.247, "r_y3": 278.55100000000004, "coord_origin": "TOPLEFT"}, "text": "1.0", "orig": "1.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 153, "label": "text", "bbox": {"l": 429.516, "t": 278.55100000000004, "r": 437.025, "b": 283.532, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 103, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 429.516, "r_y0": 283.532, "r_x1": 437.025, "r_y1": 283.532, "r_x2": 437.025, "r_y2": 278.55100000000004, "r_x3": 429.516, "r_y3": 278.55100000000004, "coord_origin": "TOPLEFT"}, "text": "0.3", "orig": "0.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 154, "label": "text", "bbox": {"l": 463.714, "t": 278.55100000000004, "r": 484.74, "b": 283.532, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 104, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 463.714, "r_y0": 283.532, "r_x1": 484.74, "r_y1": 283.532, "r_x2": 484.74, "r_y2": 278.55100000000004, "r_x3": 463.714, "r_y3": 278.55100000000004, "coord_origin": "TOPLEFT"}, "text": "104.85 $", "orig": "104.85 $", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 155, "label": "text", "bbox": {"l": 512.995, "t": 278.55100000000004, "r": 534.02, "b": 283.532, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 105, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 512.995, "r_y0": 283.532, "r_x1": 534.02, "r_y1": 283.532, "r_x2": 534.02, "r_y2": 278.55100000000004, "r_x3": 512.995, "r_y3": 278.55100000000004, "coord_origin": "TOPLEFT"}, "text": "$ 104.51", "orig": "$ 104.51", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}]}, "text": null, "otsl_seq": ["ecel", "ched", "lcel", "ched", "lcel", "nl", "ecel", "ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 7, "num_cols": 5, "table_cells": [{"bbox": {"l": 459.049, "t": 221.68899999999996, "r": 542.0, "b": 232.88099999999997, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 2, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 3, "end_col_offset_idx": 5, "text": "Weighted Average Grant Date Fair Value", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 393.244, "t": 236.812, "r": 407.346, "b": 241.79399999999998, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "RSUs", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 392.097, "t": 221.639, "r": 438.015, "b": 226.62099999999998, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 2, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 1, "end_col_offset_idx": 3, "text": "Shares (in millions)", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 427.183, "t": 236.812, "r": 440.988, "b": 241.79399999999998, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "PSUs", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 468.383, "t": 236.812, "r": 482.485, "b": 241.79399999999998, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "RSUs", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 516.926, "t": 236.812, "r": 530.73, "b": 241.79399999999998, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "PSUs", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 306.115, "t": 244.67600000000004, "r": 364.656, "b": 249.65700000000004, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Nonvested on January 1", "column_header": false, "row_header": true, "row_section": false}, {"bbox": {"l": 396.247, "t": 244.97799999999995, "r": 403.755, "b": 249.96000000000004, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "1.1", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 429.818, "t": 244.97799999999995, "r": 437.327, "b": 249.96000000000004, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "0.3", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 465.529, "t": 244.97799999999995, "r": 483.55, "b": 249.96000000000004, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "90.10 $", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 513.448, "t": 244.97799999999995, "r": 531.47, "b": 249.96000000000004, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "$ 91.19", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 306.115, "t": 253.74900000000002, "r": 325.627, "b": 258.731, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Granted", "column_header": false, "row_header": true, "row_section": false}, {"bbox": {"l": 396.247, "t": 253.74900000000002, "r": 403.755, "b": 258.731, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "0.5", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 429.818, "t": 253.74900000000002, "r": 437.327, "b": 258.731, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "0.1", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 466.436, "t": 253.74900000000002, "r": 482.548, "b": 258.731, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "117.44", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 514.291, "t": 253.74900000000002, "r": 530.81, "b": 258.731, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "122.41", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 306.115, "t": 261.61300000000006, "r": 322.629, "b": 266.595, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Vested", "column_header": false, "row_header": true, "row_section": false}, {"bbox": {"l": 394.432, "t": 261.61300000000006, "r": 405.536, "b": 266.595, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "(0.5)", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 427.702, "t": 261.61300000000006, "r": 438.806, "b": 266.595, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "(0.1)", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 468.555, "t": 261.61300000000006, "r": 482.07, "b": 266.595, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "87.08", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 516.019, "t": 261.61300000000006, "r": 529.534, "b": 266.595, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "81.14", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 306.115, "t": 269.706, "r": 356.248, "b": 274.688, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Canceled or forfeited", "column_header": false, "row_header": true, "row_section": false}, {"bbox": {"l": 394.432, "t": 270.384, "r": 405.536, "b": 275.366, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "(0.1)", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 431.028, "t": 270.384, "r": 436.428, "b": 275.366, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "-", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 465.831, "t": 270.384, "r": 482.35, "b": 275.366, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "102.01", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 516.019, "t": 270.384, "r": 529.534, "b": 275.366, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "92.18", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 306.115, "t": 278.55100000000004, "r": 373.358, "b": 283.532, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Nonvested on December 31", "column_header": false, "row_header": true, "row_section": false}, {"bbox": {"l": 396.247, "t": 278.55100000000004, "r": 403.755, "b": 283.532, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "1.0", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 429.516, "t": 278.55100000000004, "r": 437.025, "b": 283.532, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "0.3", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 463.714, "t": 278.55100000000004, "r": 484.74, "b": 283.532, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "104.85 $", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 512.995, "t": 278.55100000000004, "r": 534.02, "b": 283.532, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "$ 104.51", "column_header": false, "row_header": false, "row_section": false}]}}}, "figures_classification": null, "equations_prediction": null, "vlm_response": null}, "assembled": {"elements": [{"label": "caption", "id": 18, "page_no": 7, "cluster": {"id": 18, "label": "caption", "bbox": {"l": 53.812, "t": 208.54100000000005, "r": 385.934, "b": 216.02300000000002, "coord_origin": "TOPLEFT"}, "confidence": 0.5986505746841431, "cells": [{"index": 0, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 53.812, "r_y0": 216.02300000000002, "r_x1": 385.934, "r_y1": 216.02300000000002, "r_x2": 385.934, "r_y2": 208.54100000000005, "r_x3": 53.812, "r_y3": 208.54100000000005, "coord_origin": "TOPLEFT"}, "text": "b. Structure predicted by TableFormer, with superimposed matched PDF cell text:", "orig": "b. Structure predicted by TableFormer, with superimposed matched PDF cell text:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "b. Structure predicted by TableFormer, with superimposed matched PDF cell text:"}, {"label": "section_header", "id": 29, "page_no": 7, "cluster": {"id": 29, "label": "section_header", "bbox": {"l": 53.812, "t": 94.58900000000006, "r": 284.346, "b": 102.07100000000003, "coord_origin": "TOPLEFT"}, "confidence": 0.46452972292900085, "cells": [{"index": 1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 53.812, "r_y0": 102.07100000000003, "r_x1": 284.346, "r_y1": 102.07100000000003, "r_x2": 284.346, "r_y2": 94.58900000000006, "r_x3": 53.812, "r_y3": 94.58900000000006, "coord_origin": "TOPLEFT"}, "text": "Japanese language (previously unseen by TableFormer):", "orig": "Japanese language (previously unseen by TableFormer):", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Japanese language (previously unseen by TableFormer):"}, {"label": "section_header", "id": 31, "page_no": 7, "cluster": {"id": 31, "label": "section_header", "bbox": {"l": 304.831, "t": 94.58900000000006, "r": 431.091, "b": 102.07100000000003, "coord_origin": "TOPLEFT"}, "confidence": 0.4629225730895996, "cells": [{"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 304.831, "r_y0": 102.07100000000003, "r_x1": 431.091, "r_y1": 102.07100000000003, "r_x2": 431.091, "r_y2": 94.58900000000006, "r_x3": 304.831, "r_y3": 94.58900000000006, "coord_origin": "TOPLEFT"}, "text": "Example table from FinTabNet:", "orig": "Example table from FinTabNet:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Example table from FinTabNet:"}, {"label": "list_item", "id": 21, "page_no": 7, "cluster": {"id": 21, "label": "list_item", "bbox": {"l": 53.286, "t": 78.995, "r": 499.556, "b": 86.47699999999998, "coord_origin": "TOPLEFT"}, "confidence": 0.541211724281311, "cells": [{"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 53.286, "r_y0": 86.47699999999998, "r_x1": 499.556, "r_y1": 86.47699999999998, "r_x2": 499.556, "r_y2": 78.995, "r_x3": 53.286, "r_y3": 78.995, "coord_origin": "TOPLEFT"}, "text": "a. Red - PDF cells, Green - predicted bounding boxes, Blue - post-processed predictions matched to PDF cells", "orig": "a. Red - PDF cells, Green - predicted bounding boxes, Blue - post-processed predictions matched to PDF cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "a. Red - PDF cells, Green - predicted bounding boxes, Blue - post-processed predictions matched to PDF cells"}, {"label": "table", "id": 8, "page_no": 7, "cluster": {"id": 8, "label": "table", "bbox": {"l": 53.62853240966797, "t": 218.94857788085938, "r": 298.5574951171875, "b": 292.39996337890625, "coord_origin": "TOPLEFT"}, "confidence": 0.8824009299278259, "cells": [{"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 209.933, "r_y0": 226.00400000000002, "r_x1": 223.873, "r_y1": 226.00400000000002, "r_x2": 223.873, "r_y2": 221.35799999999995, "r_x3": 209.933, "r_y3": 221.35799999999995, "coord_origin": "TOPLEFT"}, "text": "\u8ad6\u6587\u30d5\u30a1\u30a4\u30eb", "orig": "\u8ad6\u6587\u30d5\u30a1\u30a4\u30eb", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 263.765, "r_y0": 226.00400000000002, "r_x1": 273.058, "r_y1": 226.00400000000002, "r_x2": 273.058, "r_y2": 221.35799999999995, "r_x3": 263.765, "r_y3": 221.35799999999995, "coord_origin": "TOPLEFT"}, "text": "\u53c2\u8003\u6587\u732e", "orig": "\u53c2\u8003\u6587\u732e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 110.25, "r_y0": 233.49, "r_x1": 114.896, "r_y1": 233.49, "r_x2": 114.896, "r_y2": 228.84400000000005, "r_x3": 110.25, "r_y3": 228.84400000000005, "coord_origin": "TOPLEFT"}, "text": "\u51fa\u5178", "orig": "\u51fa\u5178", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 175.366, "r_y0": 233.49, "r_x1": 186.983, "r_y1": 233.49, "r_x2": 186.983, "r_y2": 228.84400000000005, "r_x3": 175.366, "r_y3": 228.84400000000005, "coord_origin": "TOPLEFT"}, "text": "\u30d5\u30a1\u30a4\u30eb\u6570", "orig": "\u30d5\u30a1\u30a4\u30eb\u6570", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 195.314, "r_y0": 233.49, "r_x1": 199.961, "r_y1": 233.49, "r_x2": 199.961, "r_y2": 228.84400000000005, "r_x3": 195.314, "r_y3": 228.84400000000005, "coord_origin": "TOPLEFT"}, "text": "\u82f1\u8a9e", "orig": "\u82f1\u8a9e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 229.198, "r_y0": 233.49, "r_x1": 236.168, "r_y1": 233.49, "r_x2": 236.168, "r_y2": 228.84400000000005, "r_x3": 229.198, "r_y3": 228.84400000000005, "coord_origin": "TOPLEFT"}, "text": "\u65e5\u672c\u8a9e", "orig": "\u65e5\u672c\u8a9e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 256.114, "r_y0": 233.49, "r_x1": 260.761, "r_y1": 233.49, "r_x2": 260.761, "r_y2": 228.84400000000005, "r_x3": 256.114, "r_y3": 228.84400000000005, "coord_origin": "TOPLEFT"}, "text": "\u82f1\u8a9e", "orig": "\u82f1\u8a9e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 278.384, "r_y0": 233.49, "r_x1": 285.354, "r_y1": 233.49, "r_x2": 285.354, "r_y2": 228.84400000000005, "r_x3": 278.384, "r_y3": 228.84400000000005, "coord_origin": "TOPLEFT"}, "text": "\u65e5\u672c\u8a9e", "orig": "\u65e5\u672c\u8a9e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 55.531, "r_y0": 240.76800000000003, "r_x1": 162.713, "r_y1": 240.76800000000003, "r_x2": 162.713, "r_y2": 236.48199999999997, "r_x3": 55.531, "r_y3": 236.48199999999997, "coord_origin": "TOPLEFT"}, "text": "Association for Computational Linguistics(ACL2003)", "orig": "Association for Computational Linguistics(ACL2003)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 184.397, "r_y0": 240.76800000000003, "r_x1": 189.565, "r_y1": 240.76800000000003, "r_x2": 189.565, "r_y2": 236.48199999999997, "r_x3": 184.397, "r_y3": 236.48199999999997, "coord_origin": "TOPLEFT"}, "text": "65", "orig": "65", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 208.99, "r_y0": 240.76800000000003, "r_x1": 214.158, "r_y1": 240.76800000000003, "r_x2": 214.158, "r_y2": 236.48199999999997, "r_x3": 208.99, "r_y3": 236.48199999999997, "coord_origin": "TOPLEFT"}, "text": "65", "orig": "65", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 234.875, "r_y0": 240.76800000000003, "r_x1": 237.458, "r_y1": 240.76800000000003, "r_x2": 237.458, "r_y2": 236.48199999999997, "r_x3": 234.875, "r_y3": 236.48199999999997, "coord_origin": "TOPLEFT"}, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 256.884, "r_y0": 240.76800000000003, "r_x1": 264.636, "r_y1": 240.76800000000003, "r_x2": 264.636, "r_y2": 236.48199999999997, "r_x3": 256.884, "r_y3": 236.48199999999997, "coord_origin": "TOPLEFT"}, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 284.061, "r_y0": 240.76800000000003, "r_x1": 286.644, "r_y1": 240.76800000000003, "r_x2": 286.644, "r_y2": 236.48199999999997, "r_x3": 284.061, "r_y3": 236.48199999999997, "coord_origin": "TOPLEFT"}, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 55.531, "r_y0": 246.962, "r_x1": 139.722, "r_y1": 246.962, "r_x2": 139.722, "r_y2": 242.67600000000004, "r_x3": 55.531, "r_y3": 242.67600000000004, "coord_origin": "TOPLEFT"}, "text": "Computational Linguistics(COLING2002)", "orig": "Computational Linguistics(COLING2002)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 19, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.105, "r_y0": 246.962, "r_x1": 190.857, "r_y1": 246.962, "r_x2": 190.857, "r_y2": 242.67600000000004, "r_x3": 183.105, "r_y3": 242.67600000000004, "coord_origin": "TOPLEFT"}, "text": "140", "orig": "140", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 20, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 207.698, "r_y0": 246.962, "r_x1": 215.45, "r_y1": 246.962, "r_x2": 215.45, "r_y2": 242.67600000000004, "r_x3": 207.698, "r_y3": 242.67600000000004, "coord_origin": "TOPLEFT"}, "text": "140", "orig": "140", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 21, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 234.875, "r_y0": 246.962, "r_x1": 237.458, "r_y1": 246.962, "r_x2": 237.458, "r_y2": 242.67600000000004, "r_x3": 234.875, "r_y3": 242.67600000000004, "coord_origin": "TOPLEFT"}, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 22, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 256.884, "r_y0": 246.962, "r_x1": 264.636, "r_y1": 246.962, "r_x2": 264.636, "r_y2": 242.67600000000004, "r_x3": 256.884, "r_y3": 242.67600000000004, "coord_origin": "TOPLEFT"}, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 23, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 284.061, "r_y0": 246.962, "r_x1": 286.644, "r_y1": 246.962, "r_x2": 286.644, "r_y2": 242.67600000000004, "r_x3": 284.061, "r_y3": 242.67600000000004, "coord_origin": "TOPLEFT"}, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 24, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 55.531, "r_y0": 253.62199999999996, "r_x1": 74.118, "r_y1": 253.62199999999996, "r_x2": 74.118, "r_y2": 248.976, "r_x3": 55.531, "r_y3": 248.976, "coord_origin": "TOPLEFT"}, "text": "\u96fb\u6c17\u60c5\u5831\u901a\u4fe1\u5b66\u4f1a", "orig": "\u96fb\u6c17\u60c5\u5831\u901a\u4fe1\u5b66\u4f1a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 25, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 92.698, "r_y0": 253.93100000000004, "r_x1": 103.034, "r_y1": 253.93100000000004, "r_x2": 103.034, "r_y2": 249.64499999999998, "r_x3": 92.698, "r_y3": 249.64499999999998, "coord_origin": "TOPLEFT"}, "text": "2003", "orig": "2003", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 26, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 103.034, "r_y0": 253.62199999999996, "r_x1": 114.651, "r_y1": 253.62199999999996, "r_x2": 114.651, "r_y2": 248.976, "r_x3": 103.034, "r_y3": 248.976, "coord_origin": "TOPLEFT"}, "text": "\u5e74\u7dcf\u5408\u5927\u4f1a", "orig": "\u5e74\u7dcf\u5408\u5927\u4f1a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 27, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.105, "r_y0": 253.15700000000004, "r_x1": 190.857, "r_y1": 253.15700000000004, "r_x2": 190.857, "r_y2": 248.87099999999998, "r_x3": 183.105, "r_y3": 248.87099999999998, "coord_origin": "TOPLEFT"}, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 28, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 210.282, "r_y0": 253.15700000000004, "r_x1": 212.865, "r_y1": 253.15700000000004, "r_x2": 212.865, "r_y2": 248.87099999999998, "r_x3": 210.282, "r_y3": 248.87099999999998, "coord_origin": "TOPLEFT"}, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 29, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 232.292, "r_y0": 253.15700000000004, "r_x1": 240.043, "r_y1": 253.15700000000004, "r_x2": 240.043, "r_y2": 248.87099999999998, "r_x3": 232.292, "r_y3": 248.87099999999998, "coord_origin": "TOPLEFT"}, "text": "142", "orig": "142", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 30, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 256.884, "r_y0": 253.15700000000004, "r_x1": 264.636, "r_y1": 253.15700000000004, "r_x2": 264.636, "r_y2": 248.87099999999998, "r_x3": 256.884, "r_y3": 248.87099999999998, "coord_origin": "TOPLEFT"}, "text": "223", "orig": "223", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 281.477, "r_y0": 253.15700000000004, "r_x1": 289.229, "r_y1": 253.15700000000004, "r_x2": 289.229, "r_y2": 248.87099999999998, "r_x3": 281.477, "r_y3": 248.87099999999998, "coord_origin": "TOPLEFT"}, "text": "147", "orig": "147", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 55.531, "r_y0": 261.10699999999997, "r_x1": 71.794, "r_y1": 261.10699999999997, "r_x2": 71.794, "r_y2": 256.461, "r_x3": 55.531, "r_y3": 256.461, "coord_origin": "TOPLEFT"}, "text": "\u60c5\u5831\u51e6\u7406\u5b66\u4f1a\u7b2c", "orig": "\u60c5\u5831\u51e6\u7406\u5b66\u4f1a\u7b2c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 88.053, "r_y0": 261.41600000000005, "r_x1": 93.22, "r_y1": 261.41600000000005, "r_x2": 93.22, "r_y2": 257.13, "r_x3": 88.053, "r_y3": 257.13, "coord_origin": "TOPLEFT"}, "text": "65", "orig": "65", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 93.22, "r_y0": 261.10699999999997, "r_x1": 104.837, "r_y1": 261.10699999999997, "r_x2": 104.837, "r_y2": 256.461, "r_x3": 93.22, "r_y3": 256.461, "coord_origin": "TOPLEFT"}, "text": "\u56de\u5168\u56fd\u5927\u4f1a", "orig": "\u56de\u5168\u56fd\u5927\u4f1a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 116.451, "r_y0": 261.41600000000005, "r_x1": 129.882, "r_y1": 261.41600000000005, "r_x2": 129.882, "r_y2": 257.13, "r_x3": 116.451, "r_y3": 257.13, "coord_origin": "TOPLEFT"}, "text": "(2003)", "orig": "(2003)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.105, "r_y0": 260.64200000000005, "r_x1": 190.857, "r_y1": 260.64200000000005, "r_x2": 190.857, "r_y2": 256.356, "r_x3": 183.105, "r_y3": 256.356, "coord_origin": "TOPLEFT"}, "text": "177", "orig": "177", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 210.282, "r_y0": 260.64200000000005, "r_x1": 212.865, "r_y1": 260.64200000000005, "r_x2": 212.865, "r_y2": 256.356, "r_x3": 210.282, "r_y3": 256.356, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 232.292, "r_y0": 260.64200000000005, "r_x1": 240.043, "r_y1": 260.64200000000005, "r_x2": 240.043, "r_y2": 256.356, "r_x3": 232.292, "r_y3": 256.356, "coord_origin": "TOPLEFT"}, "text": "176", "orig": "176", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 256.884, "r_y0": 260.64200000000005, "r_x1": 264.636, "r_y1": 260.64200000000005, "r_x2": 264.636, "r_y2": 256.356, "r_x3": 256.884, "r_y3": 256.356, "coord_origin": "TOPLEFT"}, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 281.477, "r_y0": 260.64200000000005, "r_x1": 289.229, "r_y1": 260.64200000000005, "r_x2": 289.229, "r_y2": 256.356, "r_x3": 281.477, "r_y3": 256.356, "coord_origin": "TOPLEFT"}, "text": "236", "orig": "236", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 55.531, "r_y0": 268.33399999999995, "r_x1": 57.854, "r_y1": 268.33399999999995, "r_x2": 57.854, "r_y2": 263.688, "r_x3": 55.531, "r_y3": 263.688, "coord_origin": "TOPLEFT"}, "text": "\u7b2c", "orig": "\u7b2c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 60.177, "r_y0": 268.644, "r_x1": 65.344, "r_y1": 268.644, "r_x2": 65.344, "r_y2": 264.35699999999997, "r_x3": 60.177, "r_y3": 264.35699999999997, "coord_origin": "TOPLEFT"}, "text": "17", "orig": "17", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 65.344, "r_y0": 268.33399999999995, "r_x1": 90.902, "r_y1": 268.33399999999995, "r_x2": 90.902, "r_y2": 263.688, "r_x3": 65.344, "r_y3": 263.688, "coord_origin": "TOPLEFT"}, "text": "\u56de\u4eba\u5de5\u77e5\u80fd\u5b66\u4f1a\u5168\u56fd\u5927\u4f1a", "orig": "\u56de\u4eba\u5de5\u77e5\u80fd\u5b66\u4f1a\u5168\u56fd\u5927\u4f1a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 116.451, "r_y0": 268.644, "r_x1": 129.882, "r_y1": 268.644, "r_x2": 129.882, "r_y2": 264.35699999999997, "r_x3": 116.451, "r_y3": 264.35699999999997, "coord_origin": "TOPLEFT"}, "text": "(2003)", "orig": "(2003)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.105, "r_y0": 267.869, "r_x1": 190.857, "r_y1": 267.869, "r_x2": 190.857, "r_y2": 263.58299999999997, "r_x3": 183.105, "r_y3": 263.58299999999997, "coord_origin": "TOPLEFT"}, "text": "208", "orig": "208", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 210.282, "r_y0": 267.869, "r_x1": 212.865, "r_y1": 267.869, "r_x2": 212.865, "r_y2": 263.58299999999997, "r_x3": 210.282, "r_y3": 263.58299999999997, "coord_origin": "TOPLEFT"}, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 232.292, "r_y0": 267.869, "r_x1": 240.043, "r_y1": 267.869, "r_x2": 240.043, "r_y2": 263.58299999999997, "r_x3": 232.292, "r_y3": 263.58299999999997, "coord_origin": "TOPLEFT"}, "text": "203", "orig": "203", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 48, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 256.884, "r_y0": 267.869, "r_x1": 264.636, "r_y1": 267.869, "r_x2": 264.636, "r_y2": 263.58299999999997, "r_x3": 256.884, "r_y3": 263.58299999999997, "coord_origin": "TOPLEFT"}, "text": "152", "orig": "152", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 49, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 281.477, "r_y0": 267.869, "r_x1": 289.229, "r_y1": 267.869, "r_x2": 289.229, "r_y2": 263.58299999999997, "r_x3": 281.477, "r_y3": 263.58299999999997, "coord_origin": "TOPLEFT"}, "text": "244", "orig": "244", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 50, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 55.531, "r_y0": 275.562, "r_x1": 78.765, "r_y1": 275.562, "r_x2": 78.765, "r_y2": 270.91600000000005, "r_x3": 55.531, "r_y3": 270.91600000000005, "coord_origin": "TOPLEFT"}, "text": "\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u7814\u7a76\u4f1a\u7b2c", "orig": "\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u7814\u7a76\u4f1a\u7b2c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 51, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 101.99, "r_y0": 275.871, "r_x1": 109.742, "r_y1": 275.871, "r_x2": 109.742, "r_y2": 271.58500000000004, "r_x3": 101.99, "r_y3": 271.58500000000004, "coord_origin": "TOPLEFT"}, "text": "146", "orig": "146", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 52, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 109.742, "r_y0": 275.562, "r_x1": 112.065, "r_y1": 275.562, "r_x2": 112.065, "r_y2": 270.91600000000005, "r_x3": 109.742, "r_y3": 270.91600000000005, "coord_origin": "TOPLEFT"}, "text": "\u301c", "orig": "\u301c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 53, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 114.388, "r_y0": 275.871, "r_x1": 122.139, "r_y1": 275.871, "r_x2": 122.139, "r_y2": 271.58500000000004, "r_x3": 114.388, "r_y3": 271.58500000000004, "coord_origin": "TOPLEFT"}, "text": "155", "orig": "155", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 54, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 122.14, "r_y0": 275.562, "r_x1": 124.463, "r_y1": 275.562, "r_x2": 124.463, "r_y2": 270.91600000000005, "r_x3": 122.14, "r_y3": 270.91600000000005, "coord_origin": "TOPLEFT"}, "text": "\u56de", "orig": "\u56de", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 55, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 184.397, "r_y0": 275.096, "r_x1": 189.565, "r_y1": 275.096, "r_x2": 189.565, "r_y2": 270.80999999999995, "r_x3": 184.397, "r_y3": 270.80999999999995, "coord_origin": "TOPLEFT"}, "text": "98", "orig": "98", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 56, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 210.282, "r_y0": 275.096, "r_x1": 212.865, "r_y1": 275.096, "r_x2": 212.865, "r_y2": 270.80999999999995, "r_x3": 210.282, "r_y3": 270.80999999999995, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 57, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 233.583, "r_y0": 275.096, "r_x1": 238.751, "r_y1": 275.096, "r_x2": 238.751, "r_y2": 270.80999999999995, "r_x3": 233.583, "r_y3": 270.80999999999995, "coord_origin": "TOPLEFT"}, "text": "96", "orig": "96", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 58, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 256.884, "r_y0": 275.096, "r_x1": 264.636, "r_y1": 275.096, "r_x2": 264.636, "r_y2": 270.80999999999995, "r_x3": 256.884, "r_y3": 270.80999999999995, "coord_origin": "TOPLEFT"}, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 59, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 281.477, "r_y0": 275.096, "r_x1": 289.229, "r_y1": 275.096, "r_x2": 289.229, "r_y2": 270.80999999999995, "r_x3": 281.477, "r_y3": 270.80999999999995, "coord_origin": "TOPLEFT"}, "text": "232", "orig": "232", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 60, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 55.531, "r_y0": 283.356, "r_x1": 68.686, "r_y1": 283.356, "r_x2": 68.686, "r_y2": 279.07000000000005, "r_x3": 55.531, "r_y3": 279.07000000000005, "coord_origin": "TOPLEFT"}, "text": "WWW", "orig": "WWW", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 61, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 68.686, "r_y0": 283.047, "r_x1": 87.273, "r_y1": 283.047, "r_x2": 87.273, "r_y2": 278.40099999999995, "r_x3": 68.686, "r_y3": 278.40099999999995, "coord_origin": "TOPLEFT"}, "text": "\u304b\u3089\u53ce\u96c6\u3057\u305f\u8ad6\u6587", "orig": "\u304b\u3089\u53ce\u96c6\u3057\u305f\u8ad6\u6587", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 62, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.105, "r_y0": 282.323, "r_x1": 190.857, "r_y1": 282.323, "r_x2": 190.857, "r_y2": 278.03700000000003, "r_x3": 183.105, "r_y3": 278.03700000000003, "coord_origin": "TOPLEFT"}, "text": "107", "orig": "107", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 63, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 208.99, "r_y0": 282.323, "r_x1": 214.158, "r_y1": 282.323, "r_x2": 214.158, "r_y2": 278.03700000000003, "r_x3": 208.99, "r_y3": 278.03700000000003, "coord_origin": "TOPLEFT"}, "text": "73", "orig": "73", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 64, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 233.583, "r_y0": 282.323, "r_x1": 238.751, "r_y1": 282.323, "r_x2": 238.751, "r_y2": 278.03700000000003, "r_x3": 233.583, "r_y3": 278.03700000000003, "coord_origin": "TOPLEFT"}, "text": "34", "orig": "34", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 65, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 256.884, "r_y0": 282.323, "r_x1": 264.636, "r_y1": 282.323, "r_x2": 264.636, "r_y2": 278.03700000000003, "r_x3": 256.884, "r_y3": 278.03700000000003, "coord_origin": "TOPLEFT"}, "text": "147", "orig": "147", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 66, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 282.769, "r_y0": 282.323, "r_x1": 287.937, "r_y1": 282.323, "r_x2": 287.937, "r_y2": 278.03700000000003, "r_x3": 282.769, "r_y3": 278.03700000000003, "coord_origin": "TOPLEFT"}, "text": "96", "orig": "96", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 67, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 169.615, "r_y0": 290.274, "r_x1": 171.938, "r_y1": 290.274, "r_x2": 171.938, "r_y2": 285.628, "r_x3": 169.615, "r_y3": 285.628, "coord_origin": "TOPLEFT"}, "text": "\u8a08", "orig": "\u8a08", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 68, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.105, "r_y0": 289.809, "r_x1": 190.857, "r_y1": 289.809, "r_x2": 190.857, "r_y2": 285.522, "r_x3": 183.105, "r_y3": 285.522, "coord_origin": "TOPLEFT"}, "text": "945", "orig": "945", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 69, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 207.698, "r_y0": 289.809, "r_x1": 215.45, "r_y1": 289.809, "r_x2": 215.45, "r_y2": 285.522, "r_x3": 207.698, "r_y3": 285.522, "coord_origin": "TOPLEFT"}, "text": "294", "orig": "294", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 70, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 232.292, "r_y0": 289.809, "r_x1": 240.043, "r_y1": 289.809, "r_x2": 240.043, "r_y2": 285.522, "r_x3": 232.292, "r_y3": 285.522, "coord_origin": "TOPLEFT"}, "text": "651", "orig": "651", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 71, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 255.765, "r_y0": 289.809, "r_x1": 265.752, "r_y1": 289.809, "r_x2": 265.752, "r_y2": 285.522, "r_x3": 255.765, "r_y3": 285.522, "coord_origin": "TOPLEFT"}, "text": "1122", "orig": "1122", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 72, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 281.477, "r_y0": 289.809, "r_x1": 289.229, "r_y1": 289.809, "r_x2": 289.229, "r_y2": 285.522, "r_x3": 281.477, "r_y3": 285.522, "coord_origin": "TOPLEFT"}, "text": "955", "orig": "955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": [{"id": 55, "label": "text", "bbox": {"l": 209.933, "t": 221.35799999999995, "r": 223.873, "b": 226.00400000000002, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 209.933, "r_y0": 226.00400000000002, "r_x1": 223.873, "r_y1": 226.00400000000002, "r_x2": 223.873, "r_y2": 221.35799999999995, "r_x3": 209.933, "r_y3": 221.35799999999995, "coord_origin": "TOPLEFT"}, "text": "\u8ad6\u6587\u30d5\u30a1\u30a4\u30eb", "orig": "\u8ad6\u6587\u30d5\u30a1\u30a4\u30eb", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 56, "label": "text", "bbox": {"l": 263.765, "t": 221.35799999999995, "r": 273.058, "b": 226.00400000000002, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 263.765, "r_y0": 226.00400000000002, "r_x1": 273.058, "r_y1": 226.00400000000002, "r_x2": 273.058, "r_y2": 221.35799999999995, "r_x3": 263.765, "r_y3": 221.35799999999995, "coord_origin": "TOPLEFT"}, "text": "\u53c2\u8003\u6587\u732e", "orig": "\u53c2\u8003\u6587\u732e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 57, "label": "text", "bbox": {"l": 110.25, "t": 228.84400000000005, "r": 114.896, "b": 233.49, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 110.25, "r_y0": 233.49, "r_x1": 114.896, "r_y1": 233.49, "r_x2": 114.896, "r_y2": 228.84400000000005, "r_x3": 110.25, "r_y3": 228.84400000000005, "coord_origin": "TOPLEFT"}, "text": "\u51fa\u5178", "orig": "\u51fa\u5178", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 58, "label": "text", "bbox": {"l": 175.366, "t": 228.84400000000005, "r": 186.983, "b": 233.49, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 175.366, "r_y0": 233.49, "r_x1": 186.983, "r_y1": 233.49, "r_x2": 186.983, "r_y2": 228.84400000000005, "r_x3": 175.366, "r_y3": 228.84400000000005, "coord_origin": "TOPLEFT"}, "text": "\u30d5\u30a1\u30a4\u30eb\u6570", "orig": "\u30d5\u30a1\u30a4\u30eb\u6570", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 59, "label": "text", "bbox": {"l": 195.314, "t": 228.84400000000005, "r": 199.961, "b": 233.49, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 195.314, "r_y0": 233.49, "r_x1": 199.961, "r_y1": 233.49, "r_x2": 199.961, "r_y2": 228.84400000000005, "r_x3": 195.314, "r_y3": 228.84400000000005, "coord_origin": "TOPLEFT"}, "text": "\u82f1\u8a9e", "orig": "\u82f1\u8a9e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 60, "label": "text", "bbox": {"l": 229.198, "t": 228.84400000000005, "r": 236.168, "b": 233.49, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 229.198, "r_y0": 233.49, "r_x1": 236.168, "r_y1": 233.49, "r_x2": 236.168, "r_y2": 228.84400000000005, "r_x3": 229.198, "r_y3": 228.84400000000005, "coord_origin": "TOPLEFT"}, "text": "\u65e5\u672c\u8a9e", "orig": "\u65e5\u672c\u8a9e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 61, "label": "text", "bbox": {"l": 256.114, "t": 228.84400000000005, "r": 260.761, "b": 233.49, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 256.114, "r_y0": 233.49, "r_x1": 260.761, "r_y1": 233.49, "r_x2": 260.761, "r_y2": 228.84400000000005, "r_x3": 256.114, "r_y3": 228.84400000000005, "coord_origin": "TOPLEFT"}, "text": "\u82f1\u8a9e", "orig": "\u82f1\u8a9e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 62, "label": "text", "bbox": {"l": 278.384, "t": 228.84400000000005, "r": 285.354, "b": 233.49, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 278.384, "r_y0": 233.49, "r_x1": 285.354, "r_y1": 233.49, "r_x2": 285.354, "r_y2": 228.84400000000005, "r_x3": 278.384, "r_y3": 228.84400000000005, "coord_origin": "TOPLEFT"}, "text": "\u65e5\u672c\u8a9e", "orig": "\u65e5\u672c\u8a9e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 63, "label": "text", "bbox": {"l": 55.531, "t": 236.48199999999997, "r": 162.713, "b": 240.76800000000003, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 55.531, "r_y0": 240.76800000000003, "r_x1": 162.713, "r_y1": 240.76800000000003, "r_x2": 162.713, "r_y2": 236.48199999999997, "r_x3": 55.531, "r_y3": 236.48199999999997, "coord_origin": "TOPLEFT"}, "text": "Association for Computational Linguistics(ACL2003)", "orig": "Association for Computational Linguistics(ACL2003)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 64, "label": "text", "bbox": {"l": 184.397, "t": 236.48199999999997, "r": 189.565, "b": 240.76800000000003, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 184.397, "r_y0": 240.76800000000003, "r_x1": 189.565, "r_y1": 240.76800000000003, "r_x2": 189.565, "r_y2": 236.48199999999997, "r_x3": 184.397, "r_y3": 236.48199999999997, "coord_origin": "TOPLEFT"}, "text": "65", "orig": "65", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 65, "label": "text", "bbox": {"l": 208.99, "t": 236.48199999999997, "r": 214.158, "b": 240.76800000000003, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 208.99, "r_y0": 240.76800000000003, "r_x1": 214.158, "r_y1": 240.76800000000003, "r_x2": 214.158, "r_y2": 236.48199999999997, "r_x3": 208.99, "r_y3": 236.48199999999997, "coord_origin": "TOPLEFT"}, "text": "65", "orig": "65", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 66, "label": "text", "bbox": {"l": 234.875, "t": 236.48199999999997, "r": 237.458, "b": 240.76800000000003, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 234.875, "r_y0": 240.76800000000003, "r_x1": 237.458, "r_y1": 240.76800000000003, "r_x2": 237.458, "r_y2": 236.48199999999997, "r_x3": 234.875, "r_y3": 236.48199999999997, "coord_origin": "TOPLEFT"}, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 67, "label": "text", "bbox": {"l": 256.884, "t": 236.48199999999997, "r": 264.636, "b": 240.76800000000003, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 256.884, "r_y0": 240.76800000000003, "r_x1": 264.636, "r_y1": 240.76800000000003, "r_x2": 264.636, "r_y2": 236.48199999999997, "r_x3": 256.884, "r_y3": 236.48199999999997, "coord_origin": "TOPLEFT"}, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 68, "label": "text", "bbox": {"l": 284.061, "t": 236.48199999999997, "r": 286.644, "b": 240.76800000000003, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 284.061, "r_y0": 240.76800000000003, "r_x1": 286.644, "r_y1": 240.76800000000003, "r_x2": 286.644, "r_y2": 236.48199999999997, "r_x3": 284.061, "r_y3": 236.48199999999997, "coord_origin": "TOPLEFT"}, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 69, "label": "text", "bbox": {"l": 55.531, "t": 242.67600000000004, "r": 139.722, "b": 246.962, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 55.531, "r_y0": 246.962, "r_x1": 139.722, "r_y1": 246.962, "r_x2": 139.722, "r_y2": 242.67600000000004, "r_x3": 55.531, "r_y3": 242.67600000000004, "coord_origin": "TOPLEFT"}, "text": "Computational Linguistics(COLING2002)", "orig": "Computational Linguistics(COLING2002)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 70, "label": "text", "bbox": {"l": 183.105, "t": 242.67600000000004, "r": 190.857, "b": 246.962, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 19, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.105, "r_y0": 246.962, "r_x1": 190.857, "r_y1": 246.962, "r_x2": 190.857, "r_y2": 242.67600000000004, "r_x3": 183.105, "r_y3": 242.67600000000004, "coord_origin": "TOPLEFT"}, "text": "140", "orig": "140", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 71, "label": "text", "bbox": {"l": 207.698, "t": 242.67600000000004, "r": 215.45, "b": 246.962, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 20, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 207.698, "r_y0": 246.962, "r_x1": 215.45, "r_y1": 246.962, "r_x2": 215.45, "r_y2": 242.67600000000004, "r_x3": 207.698, "r_y3": 242.67600000000004, "coord_origin": "TOPLEFT"}, "text": "140", "orig": "140", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 72, "label": "text", "bbox": {"l": 234.875, "t": 242.67600000000004, "r": 237.458, "b": 246.962, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 21, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 234.875, "r_y0": 246.962, "r_x1": 237.458, "r_y1": 246.962, "r_x2": 237.458, "r_y2": 242.67600000000004, "r_x3": 234.875, "r_y3": 242.67600000000004, "coord_origin": "TOPLEFT"}, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 73, "label": "text", "bbox": {"l": 256.884, "t": 242.67600000000004, "r": 264.636, "b": 246.962, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 22, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 256.884, "r_y0": 246.962, "r_x1": 264.636, "r_y1": 246.962, "r_x2": 264.636, "r_y2": 242.67600000000004, "r_x3": 256.884, "r_y3": 242.67600000000004, "coord_origin": "TOPLEFT"}, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 74, "label": "text", "bbox": {"l": 284.061, "t": 242.67600000000004, "r": 286.644, "b": 246.962, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 23, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 284.061, "r_y0": 246.962, "r_x1": 286.644, "r_y1": 246.962, "r_x2": 286.644, "r_y2": 242.67600000000004, "r_x3": 284.061, "r_y3": 242.67600000000004, "coord_origin": "TOPLEFT"}, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 75, "label": "text", "bbox": {"l": 55.531, "t": 248.976, "r": 74.118, "b": 253.62199999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 24, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 55.531, "r_y0": 253.62199999999996, "r_x1": 74.118, "r_y1": 253.62199999999996, "r_x2": 74.118, "r_y2": 248.976, "r_x3": 55.531, "r_y3": 248.976, "coord_origin": "TOPLEFT"}, "text": "\u96fb\u6c17\u60c5\u5831\u901a\u4fe1\u5b66\u4f1a", "orig": "\u96fb\u6c17\u60c5\u5831\u901a\u4fe1\u5b66\u4f1a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 76, "label": "text", "bbox": {"l": 92.698, "t": 249.64499999999998, "r": 103.034, "b": 253.93100000000004, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 25, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 92.698, "r_y0": 253.93100000000004, "r_x1": 103.034, "r_y1": 253.93100000000004, "r_x2": 103.034, "r_y2": 249.64499999999998, "r_x3": 92.698, "r_y3": 249.64499999999998, "coord_origin": "TOPLEFT"}, "text": "2003", "orig": "2003", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 77, "label": "text", "bbox": {"l": 103.034, "t": 248.976, "r": 114.651, "b": 253.62199999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 26, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 103.034, "r_y0": 253.62199999999996, "r_x1": 114.651, "r_y1": 253.62199999999996, "r_x2": 114.651, "r_y2": 248.976, "r_x3": 103.034, "r_y3": 248.976, "coord_origin": "TOPLEFT"}, "text": "\u5e74\u7dcf\u5408\u5927\u4f1a", "orig": "\u5e74\u7dcf\u5408\u5927\u4f1a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 78, "label": "text", "bbox": {"l": 183.105, "t": 248.87099999999998, "r": 190.857, "b": 253.15700000000004, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 27, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.105, "r_y0": 253.15700000000004, "r_x1": 190.857, "r_y1": 253.15700000000004, "r_x2": 190.857, "r_y2": 248.87099999999998, "r_x3": 183.105, "r_y3": 248.87099999999998, "coord_origin": "TOPLEFT"}, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 79, "label": "text", "bbox": {"l": 210.282, "t": 248.87099999999998, "r": 212.865, "b": 253.15700000000004, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 28, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 210.282, "r_y0": 253.15700000000004, "r_x1": 212.865, "r_y1": 253.15700000000004, "r_x2": 212.865, "r_y2": 248.87099999999998, "r_x3": 210.282, "r_y3": 248.87099999999998, "coord_origin": "TOPLEFT"}, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 80, "label": "text", "bbox": {"l": 232.292, "t": 248.87099999999998, "r": 240.043, "b": 253.15700000000004, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 29, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 232.292, "r_y0": 253.15700000000004, "r_x1": 240.043, "r_y1": 253.15700000000004, "r_x2": 240.043, "r_y2": 248.87099999999998, "r_x3": 232.292, "r_y3": 248.87099999999998, "coord_origin": "TOPLEFT"}, "text": "142", "orig": "142", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 81, "label": "text", "bbox": {"l": 256.884, "t": 248.87099999999998, "r": 264.636, "b": 253.15700000000004, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 30, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 256.884, "r_y0": 253.15700000000004, "r_x1": 264.636, "r_y1": 253.15700000000004, "r_x2": 264.636, "r_y2": 248.87099999999998, "r_x3": 256.884, "r_y3": 248.87099999999998, "coord_origin": "TOPLEFT"}, "text": "223", "orig": "223", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 82, "label": "text", "bbox": {"l": 281.477, "t": 248.87099999999998, "r": 289.229, "b": 253.15700000000004, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 281.477, "r_y0": 253.15700000000004, "r_x1": 289.229, "r_y1": 253.15700000000004, "r_x2": 289.229, "r_y2": 248.87099999999998, "r_x3": 281.477, "r_y3": 248.87099999999998, "coord_origin": "TOPLEFT"}, "text": "147", "orig": "147", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 83, "label": "text", "bbox": {"l": 55.531, "t": 256.461, "r": 71.794, "b": 261.10699999999997, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 55.531, "r_y0": 261.10699999999997, "r_x1": 71.794, "r_y1": 261.10699999999997, "r_x2": 71.794, "r_y2": 256.461, "r_x3": 55.531, "r_y3": 256.461, "coord_origin": "TOPLEFT"}, "text": "\u60c5\u5831\u51e6\u7406\u5b66\u4f1a\u7b2c", "orig": "\u60c5\u5831\u51e6\u7406\u5b66\u4f1a\u7b2c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 84, "label": "text", "bbox": {"l": 88.053, "t": 257.13, "r": 93.22, "b": 261.41600000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 88.053, "r_y0": 261.41600000000005, "r_x1": 93.22, "r_y1": 261.41600000000005, "r_x2": 93.22, "r_y2": 257.13, "r_x3": 88.053, "r_y3": 257.13, "coord_origin": "TOPLEFT"}, "text": "65", "orig": "65", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 85, "label": "text", "bbox": {"l": 93.22, "t": 256.461, "r": 104.837, "b": 261.10699999999997, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 93.22, "r_y0": 261.10699999999997, "r_x1": 104.837, "r_y1": 261.10699999999997, "r_x2": 104.837, "r_y2": 256.461, "r_x3": 93.22, "r_y3": 256.461, "coord_origin": "TOPLEFT"}, "text": "\u56de\u5168\u56fd\u5927\u4f1a", "orig": "\u56de\u5168\u56fd\u5927\u4f1a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 86, "label": "text", "bbox": {"l": 116.451, "t": 257.13, "r": 129.882, "b": 261.41600000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 116.451, "r_y0": 261.41600000000005, "r_x1": 129.882, "r_y1": 261.41600000000005, "r_x2": 129.882, "r_y2": 257.13, "r_x3": 116.451, "r_y3": 257.13, "coord_origin": "TOPLEFT"}, "text": "(2003)", "orig": "(2003)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 87, "label": "text", "bbox": {"l": 183.105, "t": 256.356, "r": 190.857, "b": 260.64200000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.105, "r_y0": 260.64200000000005, "r_x1": 190.857, "r_y1": 260.64200000000005, "r_x2": 190.857, "r_y2": 256.356, "r_x3": 183.105, "r_y3": 256.356, "coord_origin": "TOPLEFT"}, "text": "177", "orig": "177", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 88, "label": "text", "bbox": {"l": 210.282, "t": 256.356, "r": 212.865, "b": 260.64200000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 210.282, "r_y0": 260.64200000000005, "r_x1": 212.865, "r_y1": 260.64200000000005, "r_x2": 212.865, "r_y2": 256.356, "r_x3": 210.282, "r_y3": 256.356, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 89, "label": "text", "bbox": {"l": 232.292, "t": 256.356, "r": 240.043, "b": 260.64200000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 232.292, "r_y0": 260.64200000000005, "r_x1": 240.043, "r_y1": 260.64200000000005, "r_x2": 240.043, "r_y2": 256.356, "r_x3": 232.292, "r_y3": 256.356, "coord_origin": "TOPLEFT"}, "text": "176", "orig": "176", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 90, "label": "text", "bbox": {"l": 256.884, "t": 256.356, "r": 264.636, "b": 260.64200000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 256.884, "r_y0": 260.64200000000005, "r_x1": 264.636, "r_y1": 260.64200000000005, "r_x2": 264.636, "r_y2": 256.356, "r_x3": 256.884, "r_y3": 256.356, "coord_origin": "TOPLEFT"}, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 91, "label": "text", "bbox": {"l": 281.477, "t": 256.356, "r": 289.229, "b": 260.64200000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 281.477, "r_y0": 260.64200000000005, "r_x1": 289.229, "r_y1": 260.64200000000005, "r_x2": 289.229, "r_y2": 256.356, "r_x3": 281.477, "r_y3": 256.356, "coord_origin": "TOPLEFT"}, "text": "236", "orig": "236", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 92, "label": "text", "bbox": {"l": 55.531, "t": 263.688, "r": 57.854, "b": 268.33399999999995, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 55.531, "r_y0": 268.33399999999995, "r_x1": 57.854, "r_y1": 268.33399999999995, "r_x2": 57.854, "r_y2": 263.688, "r_x3": 55.531, "r_y3": 263.688, "coord_origin": "TOPLEFT"}, "text": "\u7b2c", "orig": "\u7b2c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 93, "label": "text", "bbox": {"l": 60.177, "t": 264.35699999999997, "r": 65.344, "b": 268.644, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 60.177, "r_y0": 268.644, "r_x1": 65.344, "r_y1": 268.644, "r_x2": 65.344, "r_y2": 264.35699999999997, "r_x3": 60.177, "r_y3": 264.35699999999997, "coord_origin": "TOPLEFT"}, "text": "17", "orig": "17", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 94, "label": "text", "bbox": {"l": 65.344, "t": 263.688, "r": 90.902, "b": 268.33399999999995, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 65.344, "r_y0": 268.33399999999995, "r_x1": 90.902, "r_y1": 268.33399999999995, "r_x2": 90.902, "r_y2": 263.688, "r_x3": 65.344, "r_y3": 263.688, "coord_origin": "TOPLEFT"}, "text": "\u56de\u4eba\u5de5\u77e5\u80fd\u5b66\u4f1a\u5168\u56fd\u5927\u4f1a", "orig": "\u56de\u4eba\u5de5\u77e5\u80fd\u5b66\u4f1a\u5168\u56fd\u5927\u4f1a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 95, "label": "text", "bbox": {"l": 116.451, "t": 264.35699999999997, "r": 129.882, "b": 268.644, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 116.451, "r_y0": 268.644, "r_x1": 129.882, "r_y1": 268.644, "r_x2": 129.882, "r_y2": 264.35699999999997, "r_x3": 116.451, "r_y3": 264.35699999999997, "coord_origin": "TOPLEFT"}, "text": "(2003)", "orig": "(2003)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 96, "label": "text", "bbox": {"l": 183.105, "t": 263.58299999999997, "r": 190.857, "b": 267.869, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.105, "r_y0": 267.869, "r_x1": 190.857, "r_y1": 267.869, "r_x2": 190.857, "r_y2": 263.58299999999997, "r_x3": 183.105, "r_y3": 263.58299999999997, "coord_origin": "TOPLEFT"}, "text": "208", "orig": "208", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 97, "label": "text", "bbox": {"l": 210.282, "t": 263.58299999999997, "r": 212.865, "b": 267.869, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 210.282, "r_y0": 267.869, "r_x1": 212.865, "r_y1": 267.869, "r_x2": 212.865, "r_y2": 263.58299999999997, "r_x3": 210.282, "r_y3": 263.58299999999997, "coord_origin": "TOPLEFT"}, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 98, "label": "text", "bbox": {"l": 232.292, "t": 263.58299999999997, "r": 240.043, "b": 267.869, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 232.292, "r_y0": 267.869, "r_x1": 240.043, "r_y1": 267.869, "r_x2": 240.043, "r_y2": 263.58299999999997, "r_x3": 232.292, "r_y3": 263.58299999999997, "coord_origin": "TOPLEFT"}, "text": "203", "orig": "203", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 99, "label": "text", "bbox": {"l": 256.884, "t": 263.58299999999997, "r": 264.636, "b": 267.869, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 48, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 256.884, "r_y0": 267.869, "r_x1": 264.636, "r_y1": 267.869, "r_x2": 264.636, "r_y2": 263.58299999999997, "r_x3": 256.884, "r_y3": 263.58299999999997, "coord_origin": "TOPLEFT"}, "text": "152", "orig": "152", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 100, "label": "text", "bbox": {"l": 281.477, "t": 263.58299999999997, "r": 289.229, "b": 267.869, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 49, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 281.477, "r_y0": 267.869, "r_x1": 289.229, "r_y1": 267.869, "r_x2": 289.229, "r_y2": 263.58299999999997, "r_x3": 281.477, "r_y3": 263.58299999999997, "coord_origin": "TOPLEFT"}, "text": "244", "orig": "244", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 101, "label": "text", "bbox": {"l": 55.531, "t": 270.91600000000005, "r": 78.765, "b": 275.562, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 50, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 55.531, "r_y0": 275.562, "r_x1": 78.765, "r_y1": 275.562, "r_x2": 78.765, "r_y2": 270.91600000000005, "r_x3": 55.531, "r_y3": 270.91600000000005, "coord_origin": "TOPLEFT"}, "text": "\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u7814\u7a76\u4f1a\u7b2c", "orig": "\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u7814\u7a76\u4f1a\u7b2c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 102, "label": "text", "bbox": {"l": 101.99, "t": 271.58500000000004, "r": 109.742, "b": 275.871, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 51, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 101.99, "r_y0": 275.871, "r_x1": 109.742, "r_y1": 275.871, "r_x2": 109.742, "r_y2": 271.58500000000004, "r_x3": 101.99, "r_y3": 271.58500000000004, "coord_origin": "TOPLEFT"}, "text": "146", "orig": "146", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 103, "label": "text", "bbox": {"l": 109.742, "t": 270.91600000000005, "r": 112.065, "b": 275.562, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 52, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 109.742, "r_y0": 275.562, "r_x1": 112.065, "r_y1": 275.562, "r_x2": 112.065, "r_y2": 270.91600000000005, "r_x3": 109.742, "r_y3": 270.91600000000005, "coord_origin": "TOPLEFT"}, "text": "\u301c", "orig": "\u301c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 104, "label": "text", "bbox": {"l": 114.388, "t": 271.58500000000004, "r": 122.139, "b": 275.871, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 53, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 114.388, "r_y0": 275.871, "r_x1": 122.139, "r_y1": 275.871, "r_x2": 122.139, "r_y2": 271.58500000000004, "r_x3": 114.388, "r_y3": 271.58500000000004, "coord_origin": "TOPLEFT"}, "text": "155", "orig": "155", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 105, "label": "text", "bbox": {"l": 122.14, "t": 270.91600000000005, "r": 124.463, "b": 275.562, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 54, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 122.14, "r_y0": 275.562, "r_x1": 124.463, "r_y1": 275.562, "r_x2": 124.463, "r_y2": 270.91600000000005, "r_x3": 122.14, "r_y3": 270.91600000000005, "coord_origin": "TOPLEFT"}, "text": "\u56de", "orig": "\u56de", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 106, "label": "text", "bbox": {"l": 184.397, "t": 270.80999999999995, "r": 189.565, "b": 275.096, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 55, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 184.397, "r_y0": 275.096, "r_x1": 189.565, "r_y1": 275.096, "r_x2": 189.565, "r_y2": 270.80999999999995, "r_x3": 184.397, "r_y3": 270.80999999999995, "coord_origin": "TOPLEFT"}, "text": "98", "orig": "98", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 107, "label": "text", "bbox": {"l": 210.282, "t": 270.80999999999995, "r": 212.865, "b": 275.096, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 56, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 210.282, "r_y0": 275.096, "r_x1": 212.865, "r_y1": 275.096, "r_x2": 212.865, "r_y2": 270.80999999999995, "r_x3": 210.282, "r_y3": 270.80999999999995, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 108, "label": "text", "bbox": {"l": 233.583, "t": 270.80999999999995, "r": 238.751, "b": 275.096, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 57, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 233.583, "r_y0": 275.096, "r_x1": 238.751, "r_y1": 275.096, "r_x2": 238.751, "r_y2": 270.80999999999995, "r_x3": 233.583, "r_y3": 270.80999999999995, "coord_origin": "TOPLEFT"}, "text": "96", "orig": "96", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 109, "label": "text", "bbox": {"l": 256.884, "t": 270.80999999999995, "r": 264.636, "b": 275.096, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 58, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 256.884, "r_y0": 275.096, "r_x1": 264.636, "r_y1": 275.096, "r_x2": 264.636, "r_y2": 270.80999999999995, "r_x3": 256.884, "r_y3": 270.80999999999995, "coord_origin": "TOPLEFT"}, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 110, "label": "text", "bbox": {"l": 281.477, "t": 270.80999999999995, "r": 289.229, "b": 275.096, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 59, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 281.477, "r_y0": 275.096, "r_x1": 289.229, "r_y1": 275.096, "r_x2": 289.229, "r_y2": 270.80999999999995, "r_x3": 281.477, "r_y3": 270.80999999999995, "coord_origin": "TOPLEFT"}, "text": "232", "orig": "232", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 111, "label": "text", "bbox": {"l": 55.531, "t": 279.07000000000005, "r": 68.686, "b": 283.356, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 60, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 55.531, "r_y0": 283.356, "r_x1": 68.686, "r_y1": 283.356, "r_x2": 68.686, "r_y2": 279.07000000000005, "r_x3": 55.531, "r_y3": 279.07000000000005, "coord_origin": "TOPLEFT"}, "text": "WWW", "orig": "WWW", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 112, "label": "text", "bbox": {"l": 68.686, "t": 278.40099999999995, "r": 87.273, "b": 283.047, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 61, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 68.686, "r_y0": 283.047, "r_x1": 87.273, "r_y1": 283.047, "r_x2": 87.273, "r_y2": 278.40099999999995, "r_x3": 68.686, "r_y3": 278.40099999999995, "coord_origin": "TOPLEFT"}, "text": "\u304b\u3089\u53ce\u96c6\u3057\u305f\u8ad6\u6587", "orig": "\u304b\u3089\u53ce\u96c6\u3057\u305f\u8ad6\u6587", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 113, "label": "text", "bbox": {"l": 183.105, "t": 278.03700000000003, "r": 190.857, "b": 282.323, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 62, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.105, "r_y0": 282.323, "r_x1": 190.857, "r_y1": 282.323, "r_x2": 190.857, "r_y2": 278.03700000000003, "r_x3": 183.105, "r_y3": 278.03700000000003, "coord_origin": "TOPLEFT"}, "text": "107", "orig": "107", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 114, "label": "text", "bbox": {"l": 208.99, "t": 278.03700000000003, "r": 214.158, "b": 282.323, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 63, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 208.99, "r_y0": 282.323, "r_x1": 214.158, "r_y1": 282.323, "r_x2": 214.158, "r_y2": 278.03700000000003, "r_x3": 208.99, "r_y3": 278.03700000000003, "coord_origin": "TOPLEFT"}, "text": "73", "orig": "73", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 115, "label": "text", "bbox": {"l": 233.583, "t": 278.03700000000003, "r": 238.751, "b": 282.323, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 64, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 233.583, "r_y0": 282.323, "r_x1": 238.751, "r_y1": 282.323, "r_x2": 238.751, "r_y2": 278.03700000000003, "r_x3": 233.583, "r_y3": 278.03700000000003, "coord_origin": "TOPLEFT"}, "text": "34", "orig": "34", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 116, "label": "text", "bbox": {"l": 256.884, "t": 278.03700000000003, "r": 264.636, "b": 282.323, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 65, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 256.884, "r_y0": 282.323, "r_x1": 264.636, "r_y1": 282.323, "r_x2": 264.636, "r_y2": 278.03700000000003, "r_x3": 256.884, "r_y3": 278.03700000000003, "coord_origin": "TOPLEFT"}, "text": "147", "orig": "147", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 117, "label": "text", "bbox": {"l": 282.769, "t": 278.03700000000003, "r": 287.937, "b": 282.323, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 66, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 282.769, "r_y0": 282.323, "r_x1": 287.937, "r_y1": 282.323, "r_x2": 287.937, "r_y2": 278.03700000000003, "r_x3": 282.769, "r_y3": 278.03700000000003, "coord_origin": "TOPLEFT"}, "text": "96", "orig": "96", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 118, "label": "text", "bbox": {"l": 169.615, "t": 285.628, "r": 171.938, "b": 290.274, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 67, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 169.615, "r_y0": 290.274, "r_x1": 171.938, "r_y1": 290.274, "r_x2": 171.938, "r_y2": 285.628, "r_x3": 169.615, "r_y3": 285.628, "coord_origin": "TOPLEFT"}, "text": "\u8a08", "orig": "\u8a08", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 119, "label": "text", "bbox": {"l": 183.105, "t": 285.522, "r": 190.857, "b": 289.809, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 68, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.105, "r_y0": 289.809, "r_x1": 190.857, "r_y1": 289.809, "r_x2": 190.857, "r_y2": 285.522, "r_x3": 183.105, "r_y3": 285.522, "coord_origin": "TOPLEFT"}, "text": "945", "orig": "945", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 120, "label": "text", "bbox": {"l": 207.698, "t": 285.522, "r": 215.45, "b": 289.809, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 69, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 207.698, "r_y0": 289.809, "r_x1": 215.45, "r_y1": 289.809, "r_x2": 215.45, "r_y2": 285.522, "r_x3": 207.698, "r_y3": 285.522, "coord_origin": "TOPLEFT"}, "text": "294", "orig": "294", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 121, "label": "text", "bbox": {"l": 232.292, "t": 285.522, "r": 240.043, "b": 289.809, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 70, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 232.292, "r_y0": 289.809, "r_x1": 240.043, "r_y1": 289.809, "r_x2": 240.043, "r_y2": 285.522, "r_x3": 232.292, "r_y3": 285.522, "coord_origin": "TOPLEFT"}, "text": "651", "orig": "651", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 122, "label": "text", "bbox": {"l": 255.765, "t": 285.522, "r": 265.752, "b": 289.809, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 71, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 255.765, "r_y0": 289.809, "r_x1": 265.752, "r_y1": 289.809, "r_x2": 265.752, "r_y2": 285.522, "r_x3": 255.765, "r_y3": 285.522, "coord_origin": "TOPLEFT"}, "text": "1122", "orig": "1122", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 123, "label": "text", "bbox": {"l": 281.477, "t": 285.522, "r": 289.229, "b": 289.809, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 72, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 281.477, "r_y0": 289.809, "r_x1": 289.229, "r_y1": 289.809, "r_x2": 289.229, "r_y2": 285.522, "r_x3": 281.477, "r_y3": 285.522, "coord_origin": "TOPLEFT"}, "text": "955", "orig": "955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}]}, "text": null, "otsl_seq": ["ched", "ched", "ched", "lcel", "ched", "lcel", "nl", "ched", "ched", "ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 10, "num_cols": 6, "table_cells": [{"bbox": {"l": 209.933, "t": 221.35799999999995, "r": 223.873, "b": 226.00400000000002, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 2, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 2, "end_col_offset_idx": 4, "text": "\u8ad6\u6587\u30d5\u30a1\u30a4\u30eb", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 263.765, "t": 221.35799999999995, "r": 273.058, "b": 226.00400000000002, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 2, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 4, "end_col_offset_idx": 6, "text": "\u53c2\u8003\u6587\u732e", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 110.25, "t": 228.84400000000005, "r": 114.896, "b": 233.49, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "\u51fa\u5178", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 175.366, "t": 228.84400000000005, "r": 199.961, "b": 233.49, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "\u30d5\u30a1\u30a4\u30eb\u6570 \u82f1\u8a9e", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 229.198, "t": 228.84400000000005, "r": 236.168, "b": 233.49, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "\u65e5\u672c\u8a9e", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 256.114, "t": 228.84400000000005, "r": 260.761, "b": 233.49, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "\u82f1\u8a9e", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 278.384, "t": 228.84400000000005, "r": 285.354, "b": 233.49, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "\u65e5\u672c\u8a9e", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 55.531, "t": 236.48199999999997, "r": 162.713, "b": 240.76800000000003, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Association for Computational Linguistics(ACL2003)", "column_header": false, "row_header": true, "row_section": false}, {"bbox": {"l": 184.397, "t": 236.48199999999997, "r": 189.565, "b": 240.76800000000003, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "65", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 208.99, "t": 236.48199999999997, "r": 214.158, "b": 240.76800000000003, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "65", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 234.875, "t": 236.48199999999997, "r": 237.458, "b": 240.76800000000003, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "0", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 256.884, "t": 236.48199999999997, "r": 264.636, "b": 240.76800000000003, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "150", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 284.061, "t": 236.48199999999997, "r": 286.644, "b": 240.76800000000003, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "0", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 55.531, "t": 242.67600000000004, "r": 139.722, "b": 246.962, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Computational Linguistics(COLING2002)", "column_header": false, "row_header": true, "row_section": false}, {"bbox": {"l": 183.105, "t": 242.67600000000004, "r": 190.857, "b": 246.962, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "140", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 207.698, "t": 242.67600000000004, "r": 215.45, "b": 246.962, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "140", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 234.875, "t": 242.67600000000004, "r": 237.458, "b": 246.962, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "0", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 256.884, "t": 242.67600000000004, "r": 264.636, "b": 246.962, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "150", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 284.061, "t": 242.67600000000004, "r": 286.644, "b": 246.962, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "0", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 55.531, "t": 248.976, "r": 114.651, "b": 253.93100000000004, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "\u96fb\u6c17\u60c5\u5831\u901a\u4fe1\u5b66\u4f1a 2003 \u5e74\u7dcf\u5408\u5927\u4f1a", "column_header": false, "row_header": true, "row_section": false}, {"bbox": {"l": 183.105, "t": 248.87099999999998, "r": 190.857, "b": 253.15700000000004, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "150", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 210.282, "t": 248.87099999999998, "r": 212.865, "b": 253.15700000000004, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "8", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 232.292, "t": 248.87099999999998, "r": 240.043, "b": 253.15700000000004, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "142", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 256.884, "t": 248.87099999999998, "r": 264.636, "b": 253.15700000000004, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "223", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 281.477, "t": 248.87099999999998, "r": 289.229, "b": 253.15700000000004, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "147", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 55.531, "t": 256.461, "r": 129.882, "b": 261.41600000000005, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "\u60c5\u5831\u51e6\u7406\u5b66\u4f1a\u7b2c 65 \u56de\u5168\u56fd\u5927\u4f1a (2003)", "column_header": false, "row_header": true, "row_section": false}, {"bbox": {"l": 183.105, "t": 256.356, "r": 190.857, "b": 260.64200000000005, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "177", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 210.282, "t": 256.356, "r": 212.865, "b": 260.64200000000005, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "1", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 232.292, "t": 256.356, "r": 240.043, "b": 260.64200000000005, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "176", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 256.884, "t": 256.356, "r": 264.636, "b": 260.64200000000005, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "150", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 281.477, "t": 256.356, "r": 289.229, "b": 260.64200000000005, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "236", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 55.531, "t": 263.688, "r": 129.882, "b": 268.644, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "\u7b2c 17 \u56de\u4eba\u5de5\u77e5\u80fd\u5b66\u4f1a\u5168\u56fd\u5927\u4f1a (2003)", "column_header": false, "row_header": true, "row_section": false}, {"bbox": {"l": 183.105, "t": 263.58299999999997, "r": 190.857, "b": 267.869, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "208", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 210.282, "t": 263.58299999999997, "r": 212.865, "b": 267.869, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "5", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 232.292, "t": 263.58299999999997, "r": 240.043, "b": 267.869, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "203", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 256.884, "t": 263.58299999999997, "r": 264.636, "b": 267.869, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "152", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 281.477, "t": 263.58299999999997, "r": 289.229, "b": 267.869, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "244", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 55.531, "t": 270.91600000000005, "r": 124.463, "b": 275.871, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 7, "end_row_offset_idx": 8, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u7814\u7a76\u4f1a\u7b2c 146 \u301c 155 \u56de", "column_header": false, "row_header": true, "row_section": false}, {"bbox": {"l": 184.397, "t": 270.80999999999995, "r": 189.565, "b": 275.096, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 7, "end_row_offset_idx": 8, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "98", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 210.282, "t": 270.80999999999995, "r": 212.865, "b": 275.096, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 7, "end_row_offset_idx": 8, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "2", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 233.583, "t": 270.80999999999995, "r": 238.751, "b": 275.096, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 7, "end_row_offset_idx": 8, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "96", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 256.884, "t": 270.80999999999995, "r": 264.636, "b": 275.096, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 7, "end_row_offset_idx": 8, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "150", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 281.477, "t": 270.80999999999995, "r": 289.229, "b": 275.096, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 7, "end_row_offset_idx": 8, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "232", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 55.531, "t": 278.40099999999995, "r": 87.273, "b": 283.356, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 8, "end_row_offset_idx": 9, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "WWW \u304b\u3089\u53ce\u96c6\u3057\u305f\u8ad6\u6587", "column_header": false, "row_header": true, "row_section": false}, {"bbox": {"l": 183.105, "t": 278.03700000000003, "r": 190.857, "b": 282.323, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 8, "end_row_offset_idx": 9, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "107", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 208.99, "t": 278.03700000000003, "r": 214.158, "b": 282.323, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 8, "end_row_offset_idx": 9, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "73", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 233.583, "t": 278.03700000000003, "r": 238.751, "b": 282.323, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 8, "end_row_offset_idx": 9, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "34", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 256.884, "t": 278.03700000000003, "r": 264.636, "b": 282.323, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 8, "end_row_offset_idx": 9, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "147", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 282.769, "t": 278.03700000000003, "r": 287.937, "b": 282.323, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 8, "end_row_offset_idx": 9, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "96", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 169.615, "t": 285.628, "r": 171.938, "b": 290.274, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 9, "end_row_offset_idx": 10, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "\u8a08", "column_header": false, "row_header": true, "row_section": false}, {"bbox": {"l": 183.105, "t": 285.522, "r": 190.857, "b": 289.809, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 9, "end_row_offset_idx": 10, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "945", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 207.698, "t": 285.522, "r": 215.45, "b": 289.809, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 9, "end_row_offset_idx": 10, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "294", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 232.292, "t": 285.522, "r": 240.043, "b": 289.809, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 9, "end_row_offset_idx": 10, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "651", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 255.765, "t": 285.522, "r": 265.752, "b": 289.809, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 9, "end_row_offset_idx": 10, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "1122", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 281.477, "t": 285.522, "r": 289.229, "b": 289.809, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 9, "end_row_offset_idx": 10, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "955", "column_header": false, "row_header": false, "row_section": false}]}, {"label": "caption", "id": 16, "page_no": 7, "cluster": {"id": 16, "label": "caption", "bbox": {"l": 380.427, "t": 292.551, "r": 549.422, "b": 298.536, "coord_origin": "TOPLEFT"}, "confidence": 0.7499915957450867, "cells": [{"index": 73, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 380.427, "r_y0": 298.536, "r_x1": 549.422, "r_y1": 298.536, "r_x2": 549.422, "r_y2": 292.551, "r_x3": 380.427, "r_y3": 292.551, "coord_origin": "TOPLEFT"}, "text": "Text is aligned to match original for ease of viewing", "orig": "Text is aligned to match original for ease of viewing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Text is aligned to match original for ease of viewing"}, {"label": "table", "id": 7, "page_no": 7, "cluster": {"id": 7, "label": "table", "bbox": {"l": 304.9219970703125, "t": 218.51486206054688, "r": 550.2321166992188, "b": 287.90069580078125, "coord_origin": "TOPLEFT"}, "confidence": 0.8899767994880676, "cells": [{"index": 74, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 459.049, "r_y0": 226.67100000000005, "r_x1": 542.0, "r_y1": 226.67100000000005, "r_x2": 542.0, "r_y2": 221.68899999999996, "r_x3": 459.049, "r_y3": 221.68899999999996, "coord_origin": "TOPLEFT"}, "text": "Weighted Average Grant Date Fair", "orig": "Weighted Average Grant Date Fair", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 75, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 493.822, "r_y0": 232.88099999999997, "r_x1": 507.226, "r_y1": 232.88099999999997, "r_x2": 507.226, "r_y2": 227.899, "r_x3": 493.822, "r_y3": 227.899, "coord_origin": "TOPLEFT"}, "text": "Value", "orig": "Value", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 76, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 393.244, "r_y0": 241.79399999999998, "r_x1": 407.346, "r_y1": 241.79399999999998, "r_x2": 407.346, "r_y2": 236.812, "r_x3": 393.244, "r_y3": 236.812, "coord_origin": "TOPLEFT"}, "text": "RSUs", "orig": "RSUs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 77, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 392.097, "r_y0": 226.62099999999998, "r_x1": 438.015, "r_y1": 226.62099999999998, "r_x2": 438.015, "r_y2": 221.639, "r_x3": 392.097, "r_y3": 221.639, "coord_origin": "TOPLEFT"}, "text": "Shares (in millions)", "orig": "Shares (in millions)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 78, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 427.183, "r_y0": 241.79399999999998, "r_x1": 440.988, "r_y1": 241.79399999999998, "r_x2": 440.988, "r_y2": 236.812, "r_x3": 427.183, "r_y3": 236.812, "coord_origin": "TOPLEFT"}, "text": "PSUs", "orig": "PSUs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 79, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 468.383, "r_y0": 241.79399999999998, "r_x1": 482.485, "r_y1": 241.79399999999998, "r_x2": 482.485, "r_y2": 236.812, "r_x3": 468.383, "r_y3": 236.812, "coord_origin": "TOPLEFT"}, "text": "RSUs", "orig": "RSUs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 80, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 516.926, "r_y0": 241.79399999999998, "r_x1": 530.73, "r_y1": 241.79399999999998, "r_x2": 530.73, "r_y2": 236.812, "r_x3": 516.926, "r_y3": 236.812, "coord_origin": "TOPLEFT"}, "text": "PSUs", "orig": "PSUs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 81, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 306.115, "r_y0": 249.65700000000004, "r_x1": 364.656, "r_y1": 249.65700000000004, "r_x2": 364.656, "r_y2": 244.67600000000004, "r_x3": 306.115, "r_y3": 244.67600000000004, "coord_origin": "TOPLEFT"}, "text": "Nonvested on January 1", "orig": "Nonvested on January 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 82, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 396.247, "r_y0": 249.96000000000004, "r_x1": 403.755, "r_y1": 249.96000000000004, "r_x2": 403.755, "r_y2": 244.97799999999995, "r_x3": 396.247, "r_y3": 244.97799999999995, "coord_origin": "TOPLEFT"}, "text": "1.1", "orig": "1.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 83, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 429.818, "r_y0": 249.96000000000004, "r_x1": 437.327, "r_y1": 249.96000000000004, "r_x2": 437.327, "r_y2": 244.97799999999995, "r_x3": 429.818, "r_y3": 244.97799999999995, "coord_origin": "TOPLEFT"}, "text": "0.3", "orig": "0.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 84, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 465.529, "r_y0": 249.96000000000004, "r_x1": 483.55, "r_y1": 249.96000000000004, "r_x2": 483.55, "r_y2": 244.97799999999995, "r_x3": 465.529, "r_y3": 244.97799999999995, "coord_origin": "TOPLEFT"}, "text": "90.10 $", "orig": "90.10 $", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 85, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 513.448, "r_y0": 249.96000000000004, "r_x1": 531.47, "r_y1": 249.96000000000004, "r_x2": 531.47, "r_y2": 244.97799999999995, "r_x3": 513.448, "r_y3": 244.97799999999995, "coord_origin": "TOPLEFT"}, "text": "$ 91.19", "orig": "$ 91.19", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 86, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 306.115, "r_y0": 258.731, "r_x1": 325.627, "r_y1": 258.731, "r_x2": 325.627, "r_y2": 253.74900000000002, "r_x3": 306.115, "r_y3": 253.74900000000002, "coord_origin": "TOPLEFT"}, "text": "Granted", "orig": "Granted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 87, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 396.247, "r_y0": 258.731, "r_x1": 403.755, "r_y1": 258.731, "r_x2": 403.755, "r_y2": 253.74900000000002, "r_x3": 396.247, "r_y3": 253.74900000000002, "coord_origin": "TOPLEFT"}, "text": "0.5", "orig": "0.5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 88, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 429.818, "r_y0": 258.731, "r_x1": 437.327, "r_y1": 258.731, "r_x2": 437.327, "r_y2": 253.74900000000002, "r_x3": 429.818, "r_y3": 253.74900000000002, "coord_origin": "TOPLEFT"}, "text": "0.1", "orig": "0.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 89, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 466.436, "r_y0": 258.731, "r_x1": 482.548, "r_y1": 258.731, "r_x2": 482.548, "r_y2": 253.74900000000002, "r_x3": 466.436, "r_y3": 253.74900000000002, "coord_origin": "TOPLEFT"}, "text": "117.44", "orig": "117.44", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 90, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 514.291, "r_y0": 258.731, "r_x1": 530.81, "r_y1": 258.731, "r_x2": 530.81, "r_y2": 253.74900000000002, "r_x3": 514.291, "r_y3": 253.74900000000002, "coord_origin": "TOPLEFT"}, "text": "122.41", "orig": "122.41", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 91, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 306.115, "r_y0": 266.595, "r_x1": 322.629, "r_y1": 266.595, "r_x2": 322.629, "r_y2": 261.61300000000006, "r_x3": 306.115, "r_y3": 261.61300000000006, "coord_origin": "TOPLEFT"}, "text": "Vested", "orig": "Vested", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 92, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.432, "r_y0": 266.595, "r_x1": 405.536, "r_y1": 266.595, "r_x2": 405.536, "r_y2": 261.61300000000006, "r_x3": 394.432, "r_y3": 261.61300000000006, "coord_origin": "TOPLEFT"}, "text": "(0.5)", "orig": "(0.5)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 93, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 427.702, "r_y0": 266.595, "r_x1": 438.806, "r_y1": 266.595, "r_x2": 438.806, "r_y2": 261.61300000000006, "r_x3": 427.702, "r_y3": 261.61300000000006, "coord_origin": "TOPLEFT"}, "text": "(0.1)", "orig": "(0.1)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 94, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 468.555, "r_y0": 266.595, "r_x1": 482.07, "r_y1": 266.595, "r_x2": 482.07, "r_y2": 261.61300000000006, "r_x3": 468.555, "r_y3": 261.61300000000006, "coord_origin": "TOPLEFT"}, "text": "87.08", "orig": "87.08", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 95, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 516.019, "r_y0": 266.595, "r_x1": 529.534, "r_y1": 266.595, "r_x2": 529.534, "r_y2": 261.61300000000006, "r_x3": 516.019, "r_y3": 261.61300000000006, "coord_origin": "TOPLEFT"}, "text": "81.14", "orig": "81.14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 96, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 306.115, "r_y0": 274.688, "r_x1": 356.248, "r_y1": 274.688, "r_x2": 356.248, "r_y2": 269.706, "r_x3": 306.115, "r_y3": 269.706, "coord_origin": "TOPLEFT"}, "text": "Canceled or forfeited", "orig": "Canceled or forfeited", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 97, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.432, "r_y0": 275.366, "r_x1": 405.536, "r_y1": 275.366, "r_x2": 405.536, "r_y2": 270.384, "r_x3": 394.432, "r_y3": 270.384, "coord_origin": "TOPLEFT"}, "text": "(0.1)", "orig": "(0.1)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 98, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 431.028, "r_y0": 275.366, "r_x1": 436.428, "r_y1": 275.366, "r_x2": 436.428, "r_y2": 270.384, "r_x3": 431.028, "r_y3": 270.384, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 99, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 465.831, "r_y0": 275.366, "r_x1": 482.35, "r_y1": 275.366, "r_x2": 482.35, "r_y2": 270.384, "r_x3": 465.831, "r_y3": 270.384, "coord_origin": "TOPLEFT"}, "text": "102.01", "orig": "102.01", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 100, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 516.019, "r_y0": 275.366, "r_x1": 529.534, "r_y1": 275.366, "r_x2": 529.534, "r_y2": 270.384, "r_x3": 516.019, "r_y3": 270.384, "coord_origin": "TOPLEFT"}, "text": "92.18", "orig": "92.18", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 101, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 306.115, "r_y0": 283.532, "r_x1": 373.358, "r_y1": 283.532, "r_x2": 373.358, "r_y2": 278.55100000000004, "r_x3": 306.115, "r_y3": 278.55100000000004, "coord_origin": "TOPLEFT"}, "text": "Nonvested on December 31", "orig": "Nonvested on December 31", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 102, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 396.247, "r_y0": 283.532, "r_x1": 403.755, "r_y1": 283.532, "r_x2": 403.755, "r_y2": 278.55100000000004, "r_x3": 396.247, "r_y3": 278.55100000000004, "coord_origin": "TOPLEFT"}, "text": "1.0", "orig": "1.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 103, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 429.516, "r_y0": 283.532, "r_x1": 437.025, "r_y1": 283.532, "r_x2": 437.025, "r_y2": 278.55100000000004, "r_x3": 429.516, "r_y3": 278.55100000000004, "coord_origin": "TOPLEFT"}, "text": "0.3", "orig": "0.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 104, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 463.714, "r_y0": 283.532, "r_x1": 484.74, "r_y1": 283.532, "r_x2": 484.74, "r_y2": 278.55100000000004, "r_x3": 463.714, "r_y3": 278.55100000000004, "coord_origin": "TOPLEFT"}, "text": "104.85 $", "orig": "104.85 $", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 105, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 512.995, "r_y0": 283.532, "r_x1": 534.02, "r_y1": 283.532, "r_x2": 534.02, "r_y2": 278.55100000000004, "r_x3": 512.995, "r_y3": 278.55100000000004, "coord_origin": "TOPLEFT"}, "text": "$ 104.51", "orig": "$ 104.51", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": [{"id": 124, "label": "text", "bbox": {"l": 459.049, "t": 221.68899999999996, "r": 542.0, "b": 226.67100000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 74, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 459.049, "r_y0": 226.67100000000005, "r_x1": 542.0, "r_y1": 226.67100000000005, "r_x2": 542.0, "r_y2": 221.68899999999996, "r_x3": 459.049, "r_y3": 221.68899999999996, "coord_origin": "TOPLEFT"}, "text": "Weighted Average Grant Date Fair", "orig": "Weighted Average Grant Date Fair", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 125, "label": "text", "bbox": {"l": 493.822, "t": 227.899, "r": 507.226, "b": 232.88099999999997, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 75, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 493.822, "r_y0": 232.88099999999997, "r_x1": 507.226, "r_y1": 232.88099999999997, "r_x2": 507.226, "r_y2": 227.899, "r_x3": 493.822, "r_y3": 227.899, "coord_origin": "TOPLEFT"}, "text": "Value", "orig": "Value", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 126, "label": "text", "bbox": {"l": 393.244, "t": 236.812, "r": 407.346, "b": 241.79399999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 76, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 393.244, "r_y0": 241.79399999999998, "r_x1": 407.346, "r_y1": 241.79399999999998, "r_x2": 407.346, "r_y2": 236.812, "r_x3": 393.244, "r_y3": 236.812, "coord_origin": "TOPLEFT"}, "text": "RSUs", "orig": "RSUs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 127, "label": "text", "bbox": {"l": 392.097, "t": 221.639, "r": 438.015, "b": 226.62099999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 77, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 392.097, "r_y0": 226.62099999999998, "r_x1": 438.015, "r_y1": 226.62099999999998, "r_x2": 438.015, "r_y2": 221.639, "r_x3": 392.097, "r_y3": 221.639, "coord_origin": "TOPLEFT"}, "text": "Shares (in millions)", "orig": "Shares (in millions)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 128, "label": "text", "bbox": {"l": 427.183, "t": 236.812, "r": 440.988, "b": 241.79399999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 78, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 427.183, "r_y0": 241.79399999999998, "r_x1": 440.988, "r_y1": 241.79399999999998, "r_x2": 440.988, "r_y2": 236.812, "r_x3": 427.183, "r_y3": 236.812, "coord_origin": "TOPLEFT"}, "text": "PSUs", "orig": "PSUs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 129, "label": "text", "bbox": {"l": 468.383, "t": 236.812, "r": 482.485, "b": 241.79399999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 79, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 468.383, "r_y0": 241.79399999999998, "r_x1": 482.485, "r_y1": 241.79399999999998, "r_x2": 482.485, "r_y2": 236.812, "r_x3": 468.383, "r_y3": 236.812, "coord_origin": "TOPLEFT"}, "text": "RSUs", "orig": "RSUs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 130, "label": "text", "bbox": {"l": 516.926, "t": 236.812, "r": 530.73, "b": 241.79399999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 80, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 516.926, "r_y0": 241.79399999999998, "r_x1": 530.73, "r_y1": 241.79399999999998, "r_x2": 530.73, "r_y2": 236.812, "r_x3": 516.926, "r_y3": 236.812, "coord_origin": "TOPLEFT"}, "text": "PSUs", "orig": "PSUs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 131, "label": "text", "bbox": {"l": 306.115, "t": 244.67600000000004, "r": 364.656, "b": 249.65700000000004, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 81, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 306.115, "r_y0": 249.65700000000004, "r_x1": 364.656, "r_y1": 249.65700000000004, "r_x2": 364.656, "r_y2": 244.67600000000004, "r_x3": 306.115, "r_y3": 244.67600000000004, "coord_origin": "TOPLEFT"}, "text": "Nonvested on January 1", "orig": "Nonvested on January 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 132, "label": "text", "bbox": {"l": 396.247, "t": 244.97799999999995, "r": 403.755, "b": 249.96000000000004, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 82, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 396.247, "r_y0": 249.96000000000004, "r_x1": 403.755, "r_y1": 249.96000000000004, "r_x2": 403.755, "r_y2": 244.97799999999995, "r_x3": 396.247, "r_y3": 244.97799999999995, "coord_origin": "TOPLEFT"}, "text": "1.1", "orig": "1.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 133, "label": "text", "bbox": {"l": 429.818, "t": 244.97799999999995, "r": 437.327, "b": 249.96000000000004, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 83, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 429.818, "r_y0": 249.96000000000004, "r_x1": 437.327, "r_y1": 249.96000000000004, "r_x2": 437.327, "r_y2": 244.97799999999995, "r_x3": 429.818, "r_y3": 244.97799999999995, "coord_origin": "TOPLEFT"}, "text": "0.3", "orig": "0.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 134, "label": "text", "bbox": {"l": 465.529, "t": 244.97799999999995, "r": 483.55, "b": 249.96000000000004, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 84, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 465.529, "r_y0": 249.96000000000004, "r_x1": 483.55, "r_y1": 249.96000000000004, "r_x2": 483.55, "r_y2": 244.97799999999995, "r_x3": 465.529, "r_y3": 244.97799999999995, "coord_origin": "TOPLEFT"}, "text": "90.10 $", "orig": "90.10 $", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 135, "label": "text", "bbox": {"l": 513.448, "t": 244.97799999999995, "r": 531.47, "b": 249.96000000000004, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 85, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 513.448, "r_y0": 249.96000000000004, "r_x1": 531.47, "r_y1": 249.96000000000004, "r_x2": 531.47, "r_y2": 244.97799999999995, "r_x3": 513.448, "r_y3": 244.97799999999995, "coord_origin": "TOPLEFT"}, "text": "$ 91.19", "orig": "$ 91.19", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 136, "label": "text", "bbox": {"l": 306.115, "t": 253.74900000000002, "r": 325.627, "b": 258.731, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 86, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 306.115, "r_y0": 258.731, "r_x1": 325.627, "r_y1": 258.731, "r_x2": 325.627, "r_y2": 253.74900000000002, "r_x3": 306.115, "r_y3": 253.74900000000002, "coord_origin": "TOPLEFT"}, "text": "Granted", "orig": "Granted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 137, "label": "text", "bbox": {"l": 396.247, "t": 253.74900000000002, "r": 403.755, "b": 258.731, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 87, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 396.247, "r_y0": 258.731, "r_x1": 403.755, "r_y1": 258.731, "r_x2": 403.755, "r_y2": 253.74900000000002, "r_x3": 396.247, "r_y3": 253.74900000000002, "coord_origin": "TOPLEFT"}, "text": "0.5", "orig": "0.5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 138, "label": "text", "bbox": {"l": 429.818, "t": 253.74900000000002, "r": 437.327, "b": 258.731, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 88, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 429.818, "r_y0": 258.731, "r_x1": 437.327, "r_y1": 258.731, "r_x2": 437.327, "r_y2": 253.74900000000002, "r_x3": 429.818, "r_y3": 253.74900000000002, "coord_origin": "TOPLEFT"}, "text": "0.1", "orig": "0.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 139, "label": "text", "bbox": {"l": 466.436, "t": 253.74900000000002, "r": 482.548, "b": 258.731, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 89, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 466.436, "r_y0": 258.731, "r_x1": 482.548, "r_y1": 258.731, "r_x2": 482.548, "r_y2": 253.74900000000002, "r_x3": 466.436, "r_y3": 253.74900000000002, "coord_origin": "TOPLEFT"}, "text": "117.44", "orig": "117.44", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 140, "label": "text", "bbox": {"l": 514.291, "t": 253.74900000000002, "r": 530.81, "b": 258.731, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 90, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 514.291, "r_y0": 258.731, "r_x1": 530.81, "r_y1": 258.731, "r_x2": 530.81, "r_y2": 253.74900000000002, "r_x3": 514.291, "r_y3": 253.74900000000002, "coord_origin": "TOPLEFT"}, "text": "122.41", "orig": "122.41", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 141, "label": "text", "bbox": {"l": 306.115, "t": 261.61300000000006, "r": 322.629, "b": 266.595, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 91, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 306.115, "r_y0": 266.595, "r_x1": 322.629, "r_y1": 266.595, "r_x2": 322.629, "r_y2": 261.61300000000006, "r_x3": 306.115, "r_y3": 261.61300000000006, "coord_origin": "TOPLEFT"}, "text": "Vested", "orig": "Vested", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 142, "label": "text", "bbox": {"l": 394.432, "t": 261.61300000000006, "r": 405.536, "b": 266.595, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 92, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.432, "r_y0": 266.595, "r_x1": 405.536, "r_y1": 266.595, "r_x2": 405.536, "r_y2": 261.61300000000006, "r_x3": 394.432, "r_y3": 261.61300000000006, "coord_origin": "TOPLEFT"}, "text": "(0.5)", "orig": "(0.5)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 143, "label": "text", "bbox": {"l": 427.702, "t": 261.61300000000006, "r": 438.806, "b": 266.595, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 93, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 427.702, "r_y0": 266.595, "r_x1": 438.806, "r_y1": 266.595, "r_x2": 438.806, "r_y2": 261.61300000000006, "r_x3": 427.702, "r_y3": 261.61300000000006, "coord_origin": "TOPLEFT"}, "text": "(0.1)", "orig": "(0.1)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 144, "label": "text", "bbox": {"l": 468.555, "t": 261.61300000000006, "r": 482.07, "b": 266.595, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 94, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 468.555, "r_y0": 266.595, "r_x1": 482.07, "r_y1": 266.595, "r_x2": 482.07, "r_y2": 261.61300000000006, "r_x3": 468.555, "r_y3": 261.61300000000006, "coord_origin": "TOPLEFT"}, "text": "87.08", "orig": "87.08", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 145, "label": "text", "bbox": {"l": 516.019, "t": 261.61300000000006, "r": 529.534, "b": 266.595, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 95, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 516.019, "r_y0": 266.595, "r_x1": 529.534, "r_y1": 266.595, "r_x2": 529.534, "r_y2": 261.61300000000006, "r_x3": 516.019, "r_y3": 261.61300000000006, "coord_origin": "TOPLEFT"}, "text": "81.14", "orig": "81.14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 146, "label": "text", "bbox": {"l": 306.115, "t": 269.706, "r": 356.248, "b": 274.688, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 96, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 306.115, "r_y0": 274.688, "r_x1": 356.248, "r_y1": 274.688, "r_x2": 356.248, "r_y2": 269.706, "r_x3": 306.115, "r_y3": 269.706, "coord_origin": "TOPLEFT"}, "text": "Canceled or forfeited", "orig": "Canceled or forfeited", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 147, "label": "text", "bbox": {"l": 394.432, "t": 270.384, "r": 405.536, "b": 275.366, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 97, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.432, "r_y0": 275.366, "r_x1": 405.536, "r_y1": 275.366, "r_x2": 405.536, "r_y2": 270.384, "r_x3": 394.432, "r_y3": 270.384, "coord_origin": "TOPLEFT"}, "text": "(0.1)", "orig": "(0.1)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 148, "label": "text", "bbox": {"l": 431.028, "t": 270.384, "r": 436.428, "b": 275.366, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 98, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 431.028, "r_y0": 275.366, "r_x1": 436.428, "r_y1": 275.366, "r_x2": 436.428, "r_y2": 270.384, "r_x3": 431.028, "r_y3": 270.384, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 149, "label": "text", "bbox": {"l": 465.831, "t": 270.384, "r": 482.35, "b": 275.366, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 99, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 465.831, "r_y0": 275.366, "r_x1": 482.35, "r_y1": 275.366, "r_x2": 482.35, "r_y2": 270.384, "r_x3": 465.831, "r_y3": 270.384, "coord_origin": "TOPLEFT"}, "text": "102.01", "orig": "102.01", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 150, "label": "text", "bbox": {"l": 516.019, "t": 270.384, "r": 529.534, "b": 275.366, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 100, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 516.019, "r_y0": 275.366, "r_x1": 529.534, "r_y1": 275.366, "r_x2": 529.534, "r_y2": 270.384, "r_x3": 516.019, "r_y3": 270.384, "coord_origin": "TOPLEFT"}, "text": "92.18", "orig": "92.18", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 151, "label": "text", "bbox": {"l": 306.115, "t": 278.55100000000004, "r": 373.358, "b": 283.532, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 101, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 306.115, "r_y0": 283.532, "r_x1": 373.358, "r_y1": 283.532, "r_x2": 373.358, "r_y2": 278.55100000000004, "r_x3": 306.115, "r_y3": 278.55100000000004, "coord_origin": "TOPLEFT"}, "text": "Nonvested on December 31", "orig": "Nonvested on December 31", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 152, "label": "text", "bbox": {"l": 396.247, "t": 278.55100000000004, "r": 403.755, "b": 283.532, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 102, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 396.247, "r_y0": 283.532, "r_x1": 403.755, "r_y1": 283.532, "r_x2": 403.755, "r_y2": 278.55100000000004, "r_x3": 396.247, "r_y3": 278.55100000000004, "coord_origin": "TOPLEFT"}, "text": "1.0", "orig": "1.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 153, "label": "text", "bbox": {"l": 429.516, "t": 278.55100000000004, "r": 437.025, "b": 283.532, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 103, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 429.516, "r_y0": 283.532, "r_x1": 437.025, "r_y1": 283.532, "r_x2": 437.025, "r_y2": 278.55100000000004, "r_x3": 429.516, "r_y3": 278.55100000000004, "coord_origin": "TOPLEFT"}, "text": "0.3", "orig": "0.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 154, "label": "text", "bbox": {"l": 463.714, "t": 278.55100000000004, "r": 484.74, "b": 283.532, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 104, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 463.714, "r_y0": 283.532, "r_x1": 484.74, "r_y1": 283.532, "r_x2": 484.74, "r_y2": 278.55100000000004, "r_x3": 463.714, "r_y3": 278.55100000000004, "coord_origin": "TOPLEFT"}, "text": "104.85 $", "orig": "104.85 $", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 155, "label": "text", "bbox": {"l": 512.995, "t": 278.55100000000004, "r": 534.02, "b": 283.532, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 105, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 512.995, "r_y0": 283.532, "r_x1": 534.02, "r_y1": 283.532, "r_x2": 534.02, "r_y2": 278.55100000000004, "r_x3": 512.995, "r_y3": 278.55100000000004, "coord_origin": "TOPLEFT"}, "text": "$ 104.51", "orig": "$ 104.51", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}]}, "text": null, "otsl_seq": ["ecel", "ched", "lcel", "ched", "lcel", "nl", "ecel", "ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 7, "num_cols": 5, "table_cells": [{"bbox": {"l": 459.049, "t": 221.68899999999996, "r": 542.0, "b": 232.88099999999997, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 2, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 3, "end_col_offset_idx": 5, "text": "Weighted Average Grant Date Fair Value", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 393.244, "t": 236.812, "r": 407.346, "b": 241.79399999999998, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "RSUs", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 392.097, "t": 221.639, "r": 438.015, "b": 226.62099999999998, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 2, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 1, "end_col_offset_idx": 3, "text": "Shares (in millions)", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 427.183, "t": 236.812, "r": 440.988, "b": 241.79399999999998, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "PSUs", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 468.383, "t": 236.812, "r": 482.485, "b": 241.79399999999998, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "RSUs", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 516.926, "t": 236.812, "r": 530.73, "b": 241.79399999999998, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "PSUs", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 306.115, "t": 244.67600000000004, "r": 364.656, "b": 249.65700000000004, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Nonvested on January 1", "column_header": false, "row_header": true, "row_section": false}, {"bbox": {"l": 396.247, "t": 244.97799999999995, "r": 403.755, "b": 249.96000000000004, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "1.1", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 429.818, "t": 244.97799999999995, "r": 437.327, "b": 249.96000000000004, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "0.3", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 465.529, "t": 244.97799999999995, "r": 483.55, "b": 249.96000000000004, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "90.10 $", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 513.448, "t": 244.97799999999995, "r": 531.47, "b": 249.96000000000004, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "$ 91.19", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 306.115, "t": 253.74900000000002, "r": 325.627, "b": 258.731, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Granted", "column_header": false, "row_header": true, "row_section": false}, {"bbox": {"l": 396.247, "t": 253.74900000000002, "r": 403.755, "b": 258.731, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "0.5", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 429.818, "t": 253.74900000000002, "r": 437.327, "b": 258.731, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "0.1", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 466.436, "t": 253.74900000000002, "r": 482.548, "b": 258.731, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "117.44", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 514.291, "t": 253.74900000000002, "r": 530.81, "b": 258.731, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "122.41", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 306.115, "t": 261.61300000000006, "r": 322.629, "b": 266.595, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Vested", "column_header": false, "row_header": true, "row_section": false}, {"bbox": {"l": 394.432, "t": 261.61300000000006, "r": 405.536, "b": 266.595, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "(0.5)", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 427.702, "t": 261.61300000000006, "r": 438.806, "b": 266.595, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "(0.1)", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 468.555, "t": 261.61300000000006, "r": 482.07, "b": 266.595, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "87.08", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 516.019, "t": 261.61300000000006, "r": 529.534, "b": 266.595, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "81.14", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 306.115, "t": 269.706, "r": 356.248, "b": 274.688, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Canceled or forfeited", "column_header": false, "row_header": true, "row_section": false}, {"bbox": {"l": 394.432, "t": 270.384, "r": 405.536, "b": 275.366, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "(0.1)", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 431.028, "t": 270.384, "r": 436.428, "b": 275.366, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "-", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 465.831, "t": 270.384, "r": 482.35, "b": 275.366, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "102.01", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 516.019, "t": 270.384, "r": 529.534, "b": 275.366, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "92.18", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 306.115, "t": 278.55100000000004, "r": 373.358, "b": 283.532, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Nonvested on December 31", "column_header": false, "row_header": true, "row_section": false}, {"bbox": {"l": 396.247, "t": 278.55100000000004, "r": 403.755, "b": 283.532, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "1.0", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 429.516, "t": 278.55100000000004, "r": 437.025, "b": 283.532, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "0.3", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 463.714, "t": 278.55100000000004, "r": 484.74, "b": 283.532, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "104.85 $", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 512.995, "t": 278.55100000000004, "r": 534.02, "b": 283.532, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "$ 104.51", "column_header": false, "row_header": false, "row_section": false}]}, {"label": "caption", "id": 6, "page_no": 7, "cluster": {"id": 6, "label": "caption", "bbox": {"l": 50.112, "t": 321.146, "r": 545.114, "b": 365.564, "coord_origin": "TOPLEFT"}, "confidence": 0.9140303134918213, "cells": [{"index": 106, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 329.698, "r_x1": 86.864, "r_y1": 329.698, "r_x2": 86.864, "r_y2": 321.146, "r_x3": 50.112, "r_y3": 321.146, "coord_origin": "TOPLEFT"}, "text": "Figure 5:", "orig": "Figure 5:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 107, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 93.918, "r_y0": 329.698, "r_x1": 545.114, "r_y1": 329.698, "r_x2": 545.114, "r_y2": 321.146, "r_x3": 93.918, "r_y3": 321.146, "coord_origin": "TOPLEFT"}, "text": "One of the benefits of TableFormer is that it is language agnostic, as an example, the left part of the illustration", "orig": "One of the benefits of TableFormer is that it is language agnostic, as an example, the left part of the illustration", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 108, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 341.653, "r_x1": 545.114, "r_y1": 341.653, "r_x2": 545.114, "r_y2": 333.101, "r_x3": 50.112, "r_y3": 333.101, "coord_origin": "TOPLEFT"}, "text": "demonstrates TableFormer predictions on previously unseen language (Japanese). Additionally, we see that TableFormer is", "orig": "demonstrates TableFormer predictions on previously unseen language (Japanese). Additionally, we see that TableFormer is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 109, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 353.608, "r_x1": 545.114, "r_y1": 353.608, "r_x2": 545.114, "r_y2": 345.056, "r_x3": 50.112, "r_y3": 345.056, "coord_origin": "TOPLEFT"}, "text": "robust to variability in style and content, right side of the illustration shows the example of the TableFormer prediction from", "orig": "robust to variability in style and content, right side of the illustration shows the example of the TableFormer prediction from", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 110, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 365.564, "r_x1": 139.795, "r_y1": 365.564, "r_x2": 139.795, "r_y2": 357.012, "r_x3": 50.112, "r_y3": 357.012, "coord_origin": "TOPLEFT"}, "text": "the FinTabNet dataset.", "orig": "the FinTabNet dataset.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Figure 5: One of the benefits of TableFormer is that it is language agnostic, as an example, the left part of the illustration demonstrates TableFormer predictions on previously unseen language (Japanese). Additionally, we see that TableFormer is robust to variability in style and content, right side of the illustration shows the example of the TableFormer prediction from the FinTabNet dataset."}, {"label": "picture", "id": 12, "page_no": 7, "cluster": {"id": 12, "label": "picture", "bbox": {"l": 216.76925659179688, "t": 380.4906311035156, "r": 375.7829284667969, "b": 443.34698486328125, "coord_origin": "TOPLEFT"}, "confidence": 0.805853009223938, "cells": [{"index": 111, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 220.263, "r_y0": 386.393, "r_x1": 342.078, "r_y1": 386.393, "r_x2": 342.078, "r_y2": 381.96, "r_x3": 220.263, "r_y3": 381.96, "coord_origin": "TOPLEFT"}, "text": "Red - PDF cells, Green - predicted bounding boxes", "orig": "Red - PDF cells, Green - predicted bounding boxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": [{"id": 156, "label": "text", "bbox": {"l": 220.263, "t": 381.96, "r": 342.078, "b": 386.393, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 111, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 220.263, "r_y0": 386.393, "r_x1": 342.078, "r_y1": 386.393, "r_x2": 342.078, "r_y2": 381.96, "r_x3": 220.263, "r_y3": 381.96, "coord_origin": "TOPLEFT"}, "text": "Red - PDF cells, Green - predicted bounding boxes", "orig": "Red - PDF cells, Green - predicted bounding boxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}]}, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null}, {"label": "picture", "id": 11, "page_no": 7, "cluster": {"id": 11, "label": "picture", "bbox": {"l": 51.736167907714844, "t": 380.48065185546875, "r": 211.83778381347656, "b": 443.6580810546875, "coord_origin": "TOPLEFT"}, "confidence": 0.8308426737785339, "cells": [{"index": 112, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 53.715, "r_y0": 386.393, "r_x1": 85.657, "r_y1": 386.393, "r_x2": 85.657, "r_y2": 381.96, "r_x3": 53.715, "r_y3": 381.96, "coord_origin": "TOPLEFT"}, "text": "Ground Truth", "orig": "Ground Truth", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": [{"id": 157, "label": "text", "bbox": {"l": 53.715, "t": 381.96, "r": 85.657, "b": 386.393, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 112, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 53.715, "r_y0": 386.393, "r_x1": 85.657, "r_y1": 386.393, "r_x2": 85.657, "r_y2": 381.96, "r_x3": 53.715, "r_y3": 381.96, "coord_origin": "TOPLEFT"}, "text": "Ground Truth", "orig": "Ground Truth", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}]}, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null}, {"label": "picture", "id": 13, "page_no": 7, "cluster": {"id": 13, "label": "picture", "bbox": {"l": 383.1364440917969, "t": 381.2313232421875, "r": 542.1132202148438, "b": 442.7749328613281, "coord_origin": "TOPLEFT"}, "confidence": 0.7881615161895752, "cells": [{"index": 113, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 437.379, "r_y0": 406.686, "r_x1": 443.699, "r_y1": 406.686, "r_x2": 443.699, "r_y2": 401.109, "r_x3": 437.379, "r_y3": 401.109, "coord_origin": "TOPLEFT"}, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 114, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 450.332, "r_y0": 406.686, "r_x1": 456.651, "r_y1": 406.686, "r_x2": 456.651, "r_y2": 401.109, "r_x3": 450.332, "r_y3": 401.109, "coord_origin": "TOPLEFT"}, "text": "17", "orig": "17", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 115, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 463.285, "r_y0": 406.686, "r_x1": 469.604, "r_y1": 406.686, "r_x2": 469.604, "r_y2": 401.109, "r_x3": 463.285, "r_y3": 401.109, "coord_origin": "TOPLEFT"}, "text": "18", "orig": "18", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 116, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 476.237, "r_y0": 406.686, "r_x1": 482.557, "r_y1": 406.686, "r_x2": 482.557, "r_y2": 401.109, "r_x3": 476.237, "r_y3": 401.109, "coord_origin": "TOPLEFT"}, "text": "19", "orig": "19", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 117, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 489.19, "r_y0": 406.686, "r_x1": 495.509, "r_y1": 406.686, "r_x2": 495.509, "r_y2": 401.109, "r_x3": 489.19, "r_y3": 401.109, "coord_origin": "TOPLEFT"}, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 118, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 502.143, "r_y0": 406.686, "r_x1": 508.462, "r_y1": 406.686, "r_x2": 508.462, "r_y2": 401.109, "r_x3": 502.143, "r_y3": 401.109, "coord_origin": "TOPLEFT"}, "text": "21", "orig": "21", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 119, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 515.095, "r_y0": 406.686, "r_x1": 521.414, "r_y1": 406.686, "r_x2": 521.414, "r_y2": 401.109, "r_x3": 515.095, "r_y3": 401.109, "coord_origin": "TOPLEFT"}, "text": "22", "orig": "22", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 120, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 385.281, "r_y0": 417.172, "r_x1": 391.601, "r_y1": 417.172, "r_x2": 391.601, "r_y2": 411.594, "r_x3": 385.281, "r_y3": 411.594, "coord_origin": "TOPLEFT"}, "text": "23", "orig": "23", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 121, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 398.523, "r_y0": 417.172, "r_x1": 404.843, "r_y1": 417.172, "r_x2": 404.843, "r_y2": 411.594, "r_x3": 398.523, "r_y3": 411.594, "coord_origin": "TOPLEFT"}, "text": "24", "orig": "24", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 122, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 411.476, "r_y0": 417.172, "r_x1": 417.795, "r_y1": 417.172, "r_x2": 417.795, "r_y2": 411.594, "r_x3": 411.476, "r_y3": 411.594, "coord_origin": "TOPLEFT"}, "text": "25", "orig": "25", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 123, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 437.379, "r_y0": 417.172, "r_x1": 443.699, "r_y1": 417.172, "r_x2": 443.699, "r_y2": 411.594, "r_x3": 437.379, "r_y3": 411.594, "coord_origin": "TOPLEFT"}, "text": "26", "orig": "26", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 124, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 450.332, "r_y0": 417.172, "r_x1": 456.651, "r_y1": 417.172, "r_x2": 456.651, "r_y2": 411.594, "r_x3": 450.332, "r_y3": 411.594, "coord_origin": "TOPLEFT"}, "text": "27", "orig": "27", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 125, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 463.285, "r_y0": 417.172, "r_x1": 469.604, "r_y1": 417.172, "r_x2": 469.604, "r_y2": 411.594, "r_x3": 463.285, "r_y3": 411.594, "coord_origin": "TOPLEFT"}, "text": "28", "orig": "28", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 126, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 385.281, "r_y0": 427.203, "r_x1": 391.601, "r_y1": 427.203, "r_x2": 391.601, "r_y2": 421.626, "r_x3": 385.281, "r_y3": 421.626, "coord_origin": "TOPLEFT"}, "text": "30", "orig": "30", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 127, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 398.523, "r_y0": 427.203, "r_x1": 404.843, "r_y1": 427.203, "r_x2": 404.843, "r_y2": 421.626, "r_x3": 398.523, "r_y3": 421.626, "coord_origin": "TOPLEFT"}, "text": "31", "orig": "31", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 128, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 411.476, "r_y0": 427.203, "r_x1": 417.795, "r_y1": 427.203, "r_x2": 417.795, "r_y2": 421.626, "r_x3": 411.476, "r_y3": 421.626, "coord_origin": "TOPLEFT"}, "text": "32", "orig": "32", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 129, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 424.429, "r_y0": 427.203, "r_x1": 430.748, "r_y1": 427.203, "r_x2": 430.748, "r_y2": 421.626, "r_x3": 424.429, "r_y3": 421.626, "coord_origin": "TOPLEFT"}, "text": "33", "orig": "33", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 130, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 437.381, "r_y0": 427.203, "r_x1": 443.701, "r_y1": 427.203, "r_x2": 443.701, "r_y2": 421.626, "r_x3": 437.381, "r_y3": 421.626, "coord_origin": "TOPLEFT"}, "text": "34", "orig": "34", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 131, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 450.334, "r_y0": 427.203, "r_x1": 456.653, "r_y1": 427.203, "r_x2": 456.653, "r_y2": 421.626, "r_x3": 450.334, "r_y3": 421.626, "coord_origin": "TOPLEFT"}, "text": "35", "orig": "35", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 132, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 463.287, "r_y0": 427.203, "r_x1": 469.606, "r_y1": 427.203, "r_x2": 469.606, "r_y2": 421.626, "r_x3": 463.287, "r_y3": 421.626, "coord_origin": "TOPLEFT"}, "text": "36", "orig": "36", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 133, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 476.239, "r_y0": 427.203, "r_x1": 482.558, "r_y1": 427.203, "r_x2": 482.558, "r_y2": 421.626, "r_x3": 476.239, "r_y3": 421.626, "coord_origin": "TOPLEFT"}, "text": "37", "orig": "37", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 134, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 489.192, "r_y0": 427.203, "r_x1": 495.511, "r_y1": 427.203, "r_x2": 495.511, "r_y2": 421.626, "r_x3": 489.192, "r_y3": 421.626, "coord_origin": "TOPLEFT"}, "text": "38", "orig": "38", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 135, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 502.144, "r_y0": 427.203, "r_x1": 508.464, "r_y1": 427.203, "r_x2": 508.464, "r_y2": 421.626, "r_x3": 502.144, "r_y3": 421.626, "coord_origin": "TOPLEFT"}, "text": "39", "orig": "39", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 136, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 515.097, "r_y0": 427.203, "r_x1": 521.416, "r_y1": 427.203, "r_x2": 521.416, "r_y2": 421.626, "r_x3": 515.097, "r_y3": 421.626, "coord_origin": "TOPLEFT"}, "text": "40", "orig": "40", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 137, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 528.05, "r_y0": 427.203, "r_x1": 534.369, "r_y1": 427.203, "r_x2": 534.369, "r_y2": 421.626, "r_x3": 528.05, "r_y3": 421.626, "coord_origin": "TOPLEFT"}, "text": "41", "orig": "41", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 138, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 385.281, "r_y0": 438.178, "r_x1": 391.601, "r_y1": 438.178, "r_x2": 391.601, "r_y2": 432.6, "r_x3": 385.281, "r_y3": 432.6, "coord_origin": "TOPLEFT"}, "text": "42", "orig": "42", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 139, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 398.523, "r_y0": 438.178, "r_x1": 404.843, "r_y1": 438.178, "r_x2": 404.843, "r_y2": 432.6, "r_x3": 398.523, "r_y3": 432.6, "coord_origin": "TOPLEFT"}, "text": "43", "orig": "43", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 140, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 411.476, "r_y0": 438.178, "r_x1": 417.795, "r_y1": 438.178, "r_x2": 417.795, "r_y2": 432.6, "r_x3": 411.476, "r_y3": 432.6, "coord_origin": "TOPLEFT"}, "text": "44", "orig": "44", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 141, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 424.429, "r_y0": 438.178, "r_x1": 430.748, "r_y1": 438.178, "r_x2": 430.748, "r_y2": 432.6, "r_x3": 424.429, "r_y3": 432.6, "coord_origin": "TOPLEFT"}, "text": "45", "orig": "45", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 142, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 437.381, "r_y0": 438.178, "r_x1": 443.701, "r_y1": 438.178, "r_x2": 443.701, "r_y2": 432.6, "r_x3": 437.381, "r_y3": 432.6, "coord_origin": "TOPLEFT"}, "text": "46", "orig": "46", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 143, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 450.334, "r_y0": 438.178, "r_x1": 456.653, "r_y1": 438.178, "r_x2": 456.653, "r_y2": 432.6, "r_x3": 450.334, "r_y3": 432.6, "coord_origin": "TOPLEFT"}, "text": "47", "orig": "47", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 144, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 463.287, "r_y0": 438.178, "r_x1": 469.606, "r_y1": 438.178, "r_x2": 469.606, "r_y2": 432.6, "r_x3": 463.287, "r_y3": 432.6, "coord_origin": "TOPLEFT"}, "text": "48", "orig": "48", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 145, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 476.239, "r_y0": 438.178, "r_x1": 482.558, "r_y1": 438.178, "r_x2": 482.558, "r_y2": 432.6, "r_x3": 476.239, "r_y3": 432.6, "coord_origin": "TOPLEFT"}, "text": "49", "orig": "49", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 146, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 489.192, "r_y0": 438.178, "r_x1": 495.511, "r_y1": 438.178, "r_x2": 495.511, "r_y2": 432.6, "r_x3": 489.192, "r_y3": 432.6, "coord_origin": "TOPLEFT"}, "text": "50", "orig": "50", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 147, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 502.144, "r_y0": 438.178, "r_x1": 508.464, "r_y1": 438.178, "r_x2": 508.464, "r_y2": 432.6, "r_x3": 502.144, "r_y3": 432.6, "coord_origin": "TOPLEFT"}, "text": "51", "orig": "51", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 148, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 515.097, "r_y0": 438.178, "r_x1": 521.416, "r_y1": 438.178, "r_x2": 521.416, "r_y2": 432.6, "r_x3": 515.097, "r_y3": 432.6, "coord_origin": "TOPLEFT"}, "text": "52", "orig": "52", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 149, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 528.05, "r_y0": 438.178, "r_x1": 534.369, "r_y1": 438.178, "r_x2": 534.369, "r_y2": 432.6, "r_x3": 528.05, "r_y3": 432.6, "coord_origin": "TOPLEFT"}, "text": "53", "orig": "53", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 150, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 385.281, "r_y0": 395.333, "r_x1": 388.441, "r_y1": 395.333, "r_x2": 388.441, "r_y2": 389.756, "r_x3": 385.281, "r_y3": 389.756, "coord_origin": "TOPLEFT"}, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 151, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 398.523, "r_y0": 395.333, "r_x1": 401.683, "r_y1": 395.333, "r_x2": 401.683, "r_y2": 389.756, "r_x3": 398.523, "r_y3": 389.756, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 152, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 411.475, "r_y0": 395.333, "r_x1": 414.635, "r_y1": 395.333, "r_x2": 414.635, "r_y2": 389.756, "r_x3": 411.475, "r_y3": 389.756, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 153, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 424.427, "r_y0": 395.333, "r_x1": 427.587, "r_y1": 395.333, "r_x2": 427.587, "r_y2": 389.756, "r_x3": 424.427, "r_y3": 389.756, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 154, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 437.379, "r_y0": 395.333, "r_x1": 440.539, "r_y1": 395.333, "r_x2": 440.539, "r_y2": 389.756, "r_x3": 437.379, "r_y3": 389.756, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 155, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 450.331, "r_y0": 395.333, "r_x1": 453.491, "r_y1": 395.333, "r_x2": 453.491, "r_y2": 389.756, "r_x3": 450.331, "r_y3": 389.756, "coord_origin": "TOPLEFT"}, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 156, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 463.283, "r_y0": 395.333, "r_x1": 466.443, "r_y1": 395.333, "r_x2": 466.443, "r_y2": 389.756, "r_x3": 463.283, "r_y3": 389.756, "coord_origin": "TOPLEFT"}, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 157, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 476.235, "r_y0": 395.333, "r_x1": 479.395, "r_y1": 395.333, "r_x2": 479.395, "r_y2": 389.756, "r_x3": 476.235, "r_y3": 389.756, "coord_origin": "TOPLEFT"}, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 158, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 489.187, "r_y0": 395.333, "r_x1": 492.347, "r_y1": 395.333, "r_x2": 492.347, "r_y2": 389.756, "r_x3": 489.187, "r_y3": 389.756, "coord_origin": "TOPLEFT"}, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 159, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 502.139, "r_y0": 395.333, "r_x1": 505.299, "r_y1": 395.333, "r_x2": 505.299, "r_y2": 389.756, "r_x3": 502.139, "r_y3": 389.756, "coord_origin": "TOPLEFT"}, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 160, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 515.091, "r_y0": 395.333, "r_x1": 521.411, "r_y1": 395.333, "r_x2": 521.411, "r_y2": 389.756, "r_x3": 515.091, "r_y3": 389.756, "coord_origin": "TOPLEFT"}, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 161, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 528.044, "r_y0": 395.333, "r_x1": 534.131, "r_y1": 395.333, "r_x2": 534.131, "r_y2": 389.756, "r_x3": 528.044, "r_y3": 389.756, "coord_origin": "TOPLEFT"}, "text": "11", "orig": "11", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 162, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 385.281, "r_y0": 405.108, "r_x1": 391.601, "r_y1": 405.108, "r_x2": 391.601, "r_y2": 399.531, "r_x3": 385.281, "r_y3": 399.531, "coord_origin": "TOPLEFT"}, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 163, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 398.523, "r_y0": 405.108, "r_x1": 404.843, "r_y1": 405.108, "r_x2": 404.843, "r_y2": 399.531, "r_x3": 398.523, "r_y3": 399.531, "coord_origin": "TOPLEFT"}, "text": "13", "orig": "13", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 164, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 411.476, "r_y0": 405.108, "r_x1": 417.795, "r_y1": 405.108, "r_x2": 417.795, "r_y2": 399.531, "r_x3": 411.476, "r_y3": 399.531, "coord_origin": "TOPLEFT"}, "text": "14", "orig": "14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 165, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 424.427, "r_y0": 412.908, "r_x1": 430.746, "r_y1": 412.908, "r_x2": 430.746, "r_y2": 407.331, "r_x3": 424.427, "r_y3": 407.331, "coord_origin": "TOPLEFT"}, "text": "15", "orig": "15", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 166, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 502.869, "r_y0": 417.128, "r_x1": 509.189, "r_y1": 417.128, "r_x2": 509.189, "r_y2": 411.55, "r_x3": 502.869, "r_y3": 411.55, "coord_origin": "TOPLEFT"}, "text": "29", "orig": "29", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 167, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 384.354, "r_y0": 386.393, "r_x1": 430.993, "r_y1": 386.393, "r_x2": 430.993, "r_y2": 381.96, "r_x3": 384.354, "r_y3": 381.96, "coord_origin": "TOPLEFT"}, "text": "Predicted Structure", "orig": "Predicted Structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": [{"id": 158, "label": "text", "bbox": {"l": 437.379, "t": 401.109, "r": 443.699, "b": 406.686, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 113, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 437.379, "r_y0": 406.686, "r_x1": 443.699, "r_y1": 406.686, "r_x2": 443.699, "r_y2": 401.109, "r_x3": 437.379, "r_y3": 401.109, "coord_origin": "TOPLEFT"}, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 159, "label": "text", "bbox": {"l": 450.332, "t": 401.109, "r": 456.651, "b": 406.686, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 114, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 450.332, "r_y0": 406.686, "r_x1": 456.651, "r_y1": 406.686, "r_x2": 456.651, "r_y2": 401.109, "r_x3": 450.332, "r_y3": 401.109, "coord_origin": "TOPLEFT"}, "text": "17", "orig": "17", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 160, "label": "text", "bbox": {"l": 463.285, "t": 401.109, "r": 469.604, "b": 406.686, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 115, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 463.285, "r_y0": 406.686, "r_x1": 469.604, "r_y1": 406.686, "r_x2": 469.604, "r_y2": 401.109, "r_x3": 463.285, "r_y3": 401.109, "coord_origin": "TOPLEFT"}, "text": "18", "orig": "18", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 161, "label": "text", "bbox": {"l": 476.237, "t": 401.109, "r": 482.557, "b": 406.686, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 116, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 476.237, "r_y0": 406.686, "r_x1": 482.557, "r_y1": 406.686, "r_x2": 482.557, "r_y2": 401.109, "r_x3": 476.237, "r_y3": 401.109, "coord_origin": "TOPLEFT"}, "text": "19", "orig": "19", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 162, "label": "text", "bbox": {"l": 489.19, "t": 401.109, "r": 495.509, "b": 406.686, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 117, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 489.19, "r_y0": 406.686, "r_x1": 495.509, "r_y1": 406.686, "r_x2": 495.509, "r_y2": 401.109, "r_x3": 489.19, "r_y3": 401.109, "coord_origin": "TOPLEFT"}, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 163, "label": "text", "bbox": {"l": 502.143, "t": 401.109, "r": 508.462, "b": 406.686, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 118, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 502.143, "r_y0": 406.686, "r_x1": 508.462, "r_y1": 406.686, "r_x2": 508.462, "r_y2": 401.109, "r_x3": 502.143, "r_y3": 401.109, "coord_origin": "TOPLEFT"}, "text": "21", "orig": "21", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 164, "label": "text", "bbox": {"l": 515.095, "t": 401.109, "r": 521.414, "b": 406.686, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 119, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 515.095, "r_y0": 406.686, "r_x1": 521.414, "r_y1": 406.686, "r_x2": 521.414, "r_y2": 401.109, "r_x3": 515.095, "r_y3": 401.109, "coord_origin": "TOPLEFT"}, "text": "22", "orig": "22", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 165, "label": "text", "bbox": {"l": 385.281, "t": 411.594, "r": 391.601, "b": 417.172, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 120, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 385.281, "r_y0": 417.172, "r_x1": 391.601, "r_y1": 417.172, "r_x2": 391.601, "r_y2": 411.594, "r_x3": 385.281, "r_y3": 411.594, "coord_origin": "TOPLEFT"}, "text": "23", "orig": "23", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 166, "label": "text", "bbox": {"l": 398.523, "t": 411.594, "r": 404.843, "b": 417.172, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 121, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 398.523, "r_y0": 417.172, "r_x1": 404.843, "r_y1": 417.172, "r_x2": 404.843, "r_y2": 411.594, "r_x3": 398.523, "r_y3": 411.594, "coord_origin": "TOPLEFT"}, "text": "24", "orig": "24", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 167, "label": "text", "bbox": {"l": 411.476, "t": 411.594, "r": 417.795, "b": 417.172, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 122, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 411.476, "r_y0": 417.172, "r_x1": 417.795, "r_y1": 417.172, "r_x2": 417.795, "r_y2": 411.594, "r_x3": 411.476, "r_y3": 411.594, "coord_origin": "TOPLEFT"}, "text": "25", "orig": "25", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 168, "label": "text", "bbox": {"l": 437.379, "t": 411.594, "r": 443.699, "b": 417.172, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 123, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 437.379, "r_y0": 417.172, "r_x1": 443.699, "r_y1": 417.172, "r_x2": 443.699, "r_y2": 411.594, "r_x3": 437.379, "r_y3": 411.594, "coord_origin": "TOPLEFT"}, "text": "26", "orig": "26", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 169, "label": "text", "bbox": {"l": 450.332, "t": 411.594, "r": 456.651, "b": 417.172, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 124, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 450.332, "r_y0": 417.172, "r_x1": 456.651, "r_y1": 417.172, "r_x2": 456.651, "r_y2": 411.594, "r_x3": 450.332, "r_y3": 411.594, "coord_origin": "TOPLEFT"}, "text": "27", "orig": "27", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 170, "label": "text", "bbox": {"l": 463.285, "t": 411.594, "r": 469.604, "b": 417.172, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 125, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 463.285, "r_y0": 417.172, "r_x1": 469.604, "r_y1": 417.172, "r_x2": 469.604, "r_y2": 411.594, "r_x3": 463.285, "r_y3": 411.594, "coord_origin": "TOPLEFT"}, "text": "28", "orig": "28", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 171, "label": "text", "bbox": {"l": 385.281, "t": 421.626, "r": 391.601, "b": 427.203, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 126, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 385.281, "r_y0": 427.203, "r_x1": 391.601, "r_y1": 427.203, "r_x2": 391.601, "r_y2": 421.626, "r_x3": 385.281, "r_y3": 421.626, "coord_origin": "TOPLEFT"}, "text": "30", "orig": "30", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 172, "label": "text", "bbox": {"l": 398.523, "t": 421.626, "r": 404.843, "b": 427.203, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 127, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 398.523, "r_y0": 427.203, "r_x1": 404.843, "r_y1": 427.203, "r_x2": 404.843, "r_y2": 421.626, "r_x3": 398.523, "r_y3": 421.626, "coord_origin": "TOPLEFT"}, "text": "31", "orig": "31", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 173, "label": "text", "bbox": {"l": 411.476, "t": 421.626, "r": 417.795, "b": 427.203, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 128, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 411.476, "r_y0": 427.203, "r_x1": 417.795, "r_y1": 427.203, "r_x2": 417.795, "r_y2": 421.626, "r_x3": 411.476, "r_y3": 421.626, "coord_origin": "TOPLEFT"}, "text": "32", "orig": "32", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 174, "label": "text", "bbox": {"l": 424.429, "t": 421.626, "r": 430.748, "b": 427.203, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 129, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 424.429, "r_y0": 427.203, "r_x1": 430.748, "r_y1": 427.203, "r_x2": 430.748, "r_y2": 421.626, "r_x3": 424.429, "r_y3": 421.626, "coord_origin": "TOPLEFT"}, "text": "33", "orig": "33", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 175, "label": "text", "bbox": {"l": 437.381, "t": 421.626, "r": 443.701, "b": 427.203, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 130, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 437.381, "r_y0": 427.203, "r_x1": 443.701, "r_y1": 427.203, "r_x2": 443.701, "r_y2": 421.626, "r_x3": 437.381, "r_y3": 421.626, "coord_origin": "TOPLEFT"}, "text": "34", "orig": "34", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 176, "label": "text", "bbox": {"l": 450.334, "t": 421.626, "r": 456.653, "b": 427.203, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 131, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 450.334, "r_y0": 427.203, "r_x1": 456.653, "r_y1": 427.203, "r_x2": 456.653, "r_y2": 421.626, "r_x3": 450.334, "r_y3": 421.626, "coord_origin": "TOPLEFT"}, "text": "35", "orig": "35", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 177, "label": "text", "bbox": {"l": 463.287, "t": 421.626, "r": 469.606, "b": 427.203, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 132, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 463.287, "r_y0": 427.203, "r_x1": 469.606, "r_y1": 427.203, "r_x2": 469.606, "r_y2": 421.626, "r_x3": 463.287, "r_y3": 421.626, "coord_origin": "TOPLEFT"}, "text": "36", "orig": "36", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 178, "label": "text", "bbox": {"l": 476.239, "t": 421.626, "r": 482.558, "b": 427.203, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 133, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 476.239, "r_y0": 427.203, "r_x1": 482.558, "r_y1": 427.203, "r_x2": 482.558, "r_y2": 421.626, "r_x3": 476.239, "r_y3": 421.626, "coord_origin": "TOPLEFT"}, "text": "37", "orig": "37", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 179, "label": "text", "bbox": {"l": 489.192, "t": 421.626, "r": 495.511, "b": 427.203, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 134, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 489.192, "r_y0": 427.203, "r_x1": 495.511, "r_y1": 427.203, "r_x2": 495.511, "r_y2": 421.626, "r_x3": 489.192, "r_y3": 421.626, "coord_origin": "TOPLEFT"}, "text": "38", "orig": "38", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 180, "label": "text", "bbox": {"l": 502.144, "t": 421.626, "r": 508.464, "b": 427.203, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 135, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 502.144, "r_y0": 427.203, "r_x1": 508.464, "r_y1": 427.203, "r_x2": 508.464, "r_y2": 421.626, "r_x3": 502.144, "r_y3": 421.626, "coord_origin": "TOPLEFT"}, "text": "39", "orig": "39", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 181, "label": "text", "bbox": {"l": 515.097, "t": 421.626, "r": 521.416, "b": 427.203, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 136, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 515.097, "r_y0": 427.203, "r_x1": 521.416, "r_y1": 427.203, "r_x2": 521.416, "r_y2": 421.626, "r_x3": 515.097, "r_y3": 421.626, "coord_origin": "TOPLEFT"}, "text": "40", "orig": "40", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 182, "label": "text", "bbox": {"l": 528.05, "t": 421.626, "r": 534.369, "b": 427.203, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 137, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 528.05, "r_y0": 427.203, "r_x1": 534.369, "r_y1": 427.203, "r_x2": 534.369, "r_y2": 421.626, "r_x3": 528.05, "r_y3": 421.626, "coord_origin": "TOPLEFT"}, "text": "41", "orig": "41", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 183, "label": "text", "bbox": {"l": 385.281, "t": 432.6, "r": 391.601, "b": 438.178, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 138, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 385.281, "r_y0": 438.178, "r_x1": 391.601, "r_y1": 438.178, "r_x2": 391.601, "r_y2": 432.6, "r_x3": 385.281, "r_y3": 432.6, "coord_origin": "TOPLEFT"}, "text": "42", "orig": "42", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 184, "label": "text", "bbox": {"l": 398.523, "t": 432.6, "r": 404.843, "b": 438.178, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 139, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 398.523, "r_y0": 438.178, "r_x1": 404.843, "r_y1": 438.178, "r_x2": 404.843, "r_y2": 432.6, "r_x3": 398.523, "r_y3": 432.6, "coord_origin": "TOPLEFT"}, "text": "43", "orig": "43", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 185, "label": "text", "bbox": {"l": 411.476, "t": 432.6, "r": 417.795, "b": 438.178, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 140, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 411.476, "r_y0": 438.178, "r_x1": 417.795, "r_y1": 438.178, "r_x2": 417.795, "r_y2": 432.6, "r_x3": 411.476, "r_y3": 432.6, "coord_origin": "TOPLEFT"}, "text": "44", "orig": "44", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 186, "label": "text", "bbox": {"l": 424.429, "t": 432.6, "r": 430.748, "b": 438.178, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 141, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 424.429, "r_y0": 438.178, "r_x1": 430.748, "r_y1": 438.178, "r_x2": 430.748, "r_y2": 432.6, "r_x3": 424.429, "r_y3": 432.6, "coord_origin": "TOPLEFT"}, "text": "45", "orig": "45", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 187, "label": "text", "bbox": {"l": 437.381, "t": 432.6, "r": 443.701, "b": 438.178, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 142, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 437.381, "r_y0": 438.178, "r_x1": 443.701, "r_y1": 438.178, "r_x2": 443.701, "r_y2": 432.6, "r_x3": 437.381, "r_y3": 432.6, "coord_origin": "TOPLEFT"}, "text": "46", "orig": "46", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 188, "label": "text", "bbox": {"l": 450.334, "t": 432.6, "r": 456.653, "b": 438.178, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 143, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 450.334, "r_y0": 438.178, "r_x1": 456.653, "r_y1": 438.178, "r_x2": 456.653, "r_y2": 432.6, "r_x3": 450.334, "r_y3": 432.6, "coord_origin": "TOPLEFT"}, "text": "47", "orig": "47", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 189, "label": "text", "bbox": {"l": 463.287, "t": 432.6, "r": 469.606, "b": 438.178, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 144, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 463.287, "r_y0": 438.178, "r_x1": 469.606, "r_y1": 438.178, "r_x2": 469.606, "r_y2": 432.6, "r_x3": 463.287, "r_y3": 432.6, "coord_origin": "TOPLEFT"}, "text": "48", "orig": "48", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 190, "label": "text", "bbox": {"l": 476.239, "t": 432.6, "r": 482.558, "b": 438.178, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 145, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 476.239, "r_y0": 438.178, "r_x1": 482.558, "r_y1": 438.178, "r_x2": 482.558, "r_y2": 432.6, "r_x3": 476.239, "r_y3": 432.6, "coord_origin": "TOPLEFT"}, "text": "49", "orig": "49", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 191, "label": "text", "bbox": {"l": 489.192, "t": 432.6, "r": 495.511, "b": 438.178, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 146, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 489.192, "r_y0": 438.178, "r_x1": 495.511, "r_y1": 438.178, "r_x2": 495.511, "r_y2": 432.6, "r_x3": 489.192, "r_y3": 432.6, "coord_origin": "TOPLEFT"}, "text": "50", "orig": "50", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 192, "label": "text", "bbox": {"l": 502.144, "t": 432.6, "r": 508.464, "b": 438.178, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 147, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 502.144, "r_y0": 438.178, "r_x1": 508.464, "r_y1": 438.178, "r_x2": 508.464, "r_y2": 432.6, "r_x3": 502.144, "r_y3": 432.6, "coord_origin": "TOPLEFT"}, "text": "51", "orig": "51", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 193, "label": "text", "bbox": {"l": 515.097, "t": 432.6, "r": 521.416, "b": 438.178, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 148, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 515.097, "r_y0": 438.178, "r_x1": 521.416, "r_y1": 438.178, "r_x2": 521.416, "r_y2": 432.6, "r_x3": 515.097, "r_y3": 432.6, "coord_origin": "TOPLEFT"}, "text": "52", "orig": "52", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 194, "label": "text", "bbox": {"l": 528.05, "t": 432.6, "r": 534.369, "b": 438.178, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 149, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 528.05, "r_y0": 438.178, "r_x1": 534.369, "r_y1": 438.178, "r_x2": 534.369, "r_y2": 432.6, "r_x3": 528.05, "r_y3": 432.6, "coord_origin": "TOPLEFT"}, "text": "53", "orig": "53", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 195, "label": "text", "bbox": {"l": 385.281, "t": 389.756, "r": 388.441, "b": 395.333, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 150, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 385.281, "r_y0": 395.333, "r_x1": 388.441, "r_y1": 395.333, "r_x2": 388.441, "r_y2": 389.756, "r_x3": 385.281, "r_y3": 389.756, "coord_origin": "TOPLEFT"}, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 196, "label": "text", "bbox": {"l": 398.523, "t": 389.756, "r": 401.683, "b": 395.333, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 151, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 398.523, "r_y0": 395.333, "r_x1": 401.683, "r_y1": 395.333, "r_x2": 401.683, "r_y2": 389.756, "r_x3": 398.523, "r_y3": 389.756, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 197, "label": "text", "bbox": {"l": 411.475, "t": 389.756, "r": 414.635, "b": 395.333, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 152, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 411.475, "r_y0": 395.333, "r_x1": 414.635, "r_y1": 395.333, "r_x2": 414.635, "r_y2": 389.756, "r_x3": 411.475, "r_y3": 389.756, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 198, "label": "text", "bbox": {"l": 424.427, "t": 389.756, "r": 427.587, "b": 395.333, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 153, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 424.427, "r_y0": 395.333, "r_x1": 427.587, "r_y1": 395.333, "r_x2": 427.587, "r_y2": 389.756, "r_x3": 424.427, "r_y3": 389.756, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 199, "label": "text", "bbox": {"l": 437.379, "t": 389.756, "r": 440.539, "b": 395.333, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 154, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 437.379, "r_y0": 395.333, "r_x1": 440.539, "r_y1": 395.333, "r_x2": 440.539, "r_y2": 389.756, "r_x3": 437.379, "r_y3": 389.756, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 200, "label": "text", "bbox": {"l": 450.331, "t": 389.756, "r": 453.491, "b": 395.333, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 155, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 450.331, "r_y0": 395.333, "r_x1": 453.491, "r_y1": 395.333, "r_x2": 453.491, "r_y2": 389.756, "r_x3": 450.331, "r_y3": 389.756, "coord_origin": "TOPLEFT"}, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 201, "label": "text", "bbox": {"l": 463.283, "t": 389.756, "r": 466.443, "b": 395.333, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 156, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 463.283, "r_y0": 395.333, "r_x1": 466.443, "r_y1": 395.333, "r_x2": 466.443, "r_y2": 389.756, "r_x3": 463.283, "r_y3": 389.756, "coord_origin": "TOPLEFT"}, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 202, "label": "text", "bbox": {"l": 476.235, "t": 389.756, "r": 479.395, "b": 395.333, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 157, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 476.235, "r_y0": 395.333, "r_x1": 479.395, "r_y1": 395.333, "r_x2": 479.395, "r_y2": 389.756, "r_x3": 476.235, "r_y3": 389.756, "coord_origin": "TOPLEFT"}, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 203, "label": "text", "bbox": {"l": 489.187, "t": 389.756, "r": 492.347, "b": 395.333, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 158, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 489.187, "r_y0": 395.333, "r_x1": 492.347, "r_y1": 395.333, "r_x2": 492.347, "r_y2": 389.756, "r_x3": 489.187, "r_y3": 389.756, "coord_origin": "TOPLEFT"}, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 204, "label": "text", "bbox": {"l": 502.139, "t": 389.756, "r": 505.299, "b": 395.333, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 159, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 502.139, "r_y0": 395.333, "r_x1": 505.299, "r_y1": 395.333, "r_x2": 505.299, "r_y2": 389.756, "r_x3": 502.139, "r_y3": 389.756, "coord_origin": "TOPLEFT"}, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 205, "label": "text", "bbox": {"l": 515.091, "t": 389.756, "r": 521.411, "b": 395.333, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 160, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 515.091, "r_y0": 395.333, "r_x1": 521.411, "r_y1": 395.333, "r_x2": 521.411, "r_y2": 389.756, "r_x3": 515.091, "r_y3": 389.756, "coord_origin": "TOPLEFT"}, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 206, "label": "text", "bbox": {"l": 528.044, "t": 389.756, "r": 534.131, "b": 395.333, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 161, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 528.044, "r_y0": 395.333, "r_x1": 534.131, "r_y1": 395.333, "r_x2": 534.131, "r_y2": 389.756, "r_x3": 528.044, "r_y3": 389.756, "coord_origin": "TOPLEFT"}, "text": "11", "orig": "11", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 207, "label": "text", "bbox": {"l": 385.281, "t": 399.531, "r": 391.601, "b": 405.108, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 162, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 385.281, "r_y0": 405.108, "r_x1": 391.601, "r_y1": 405.108, "r_x2": 391.601, "r_y2": 399.531, "r_x3": 385.281, "r_y3": 399.531, "coord_origin": "TOPLEFT"}, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 208, "label": "text", "bbox": {"l": 398.523, "t": 399.531, "r": 404.843, "b": 405.108, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 163, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 398.523, "r_y0": 405.108, "r_x1": 404.843, "r_y1": 405.108, "r_x2": 404.843, "r_y2": 399.531, "r_x3": 398.523, "r_y3": 399.531, "coord_origin": "TOPLEFT"}, "text": "13", "orig": "13", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 209, "label": "text", "bbox": {"l": 411.476, "t": 399.531, "r": 417.795, "b": 405.108, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 164, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 411.476, "r_y0": 405.108, "r_x1": 417.795, "r_y1": 405.108, "r_x2": 417.795, "r_y2": 399.531, "r_x3": 411.476, "r_y3": 399.531, "coord_origin": "TOPLEFT"}, "text": "14", "orig": "14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 210, "label": "text", "bbox": {"l": 424.427, "t": 407.331, "r": 430.746, "b": 412.908, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 165, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 424.427, "r_y0": 412.908, "r_x1": 430.746, "r_y1": 412.908, "r_x2": 430.746, "r_y2": 407.331, "r_x3": 424.427, "r_y3": 407.331, "coord_origin": "TOPLEFT"}, "text": "15", "orig": "15", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 211, "label": "text", "bbox": {"l": 502.869, "t": 411.55, "r": 509.189, "b": 417.128, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 166, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 502.869, "r_y0": 417.128, "r_x1": 509.189, "r_y1": 417.128, "r_x2": 509.189, "r_y2": 411.55, "r_x3": 502.869, "r_y3": 411.55, "coord_origin": "TOPLEFT"}, "text": "29", "orig": "29", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 212, "label": "text", "bbox": {"l": 384.354, "t": 381.96, "r": 430.993, "b": 386.393, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 167, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 384.354, "r_y0": 386.393, "r_x1": 430.993, "r_y1": 386.393, "r_x2": 430.993, "r_y2": 381.96, "r_x3": 384.354, "r_y3": 381.96, "coord_origin": "TOPLEFT"}, "text": "Predicted Structure", "orig": "Predicted Structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}]}, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null}, {"label": "caption", "id": 5, "page_no": 7, "cluster": {"id": 5, "label": "caption", "bbox": {"l": 62.595, "t": 458.997, "r": 532.63, "b": 467.549, "coord_origin": "TOPLEFT"}, "confidence": 0.9153602719306946, "cells": [{"index": 168, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.595, "r_y0": 467.549, "r_x1": 98.849, "r_y1": 467.549, "r_x2": 98.849, "r_y2": 458.997, "r_x3": 62.595, "r_y3": 458.997, "coord_origin": "TOPLEFT"}, "text": "Figure 6:", "orig": "Figure 6:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 169, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 104.428, "r_y0": 467.549, "r_x1": 532.63, "r_y1": 467.549, "r_x2": 532.63, "r_y2": 458.997, "r_x3": 104.428, "r_y3": 458.997, "coord_origin": "TOPLEFT"}, "text": "An example of TableFormer predictions (bounding boxes and structure) from generated SynthTabNet table.", "orig": "An example of TableFormer predictions (bounding boxes and structure) from generated SynthTabNet table.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Figure 6: An example of TableFormer predictions (bounding boxes and structure) from generated SynthTabNet table."}, {"label": "section_header", "id": 2, "page_no": 7, "cluster": {"id": 2, "label": "section_header", "bbox": {"l": 50.112, "t": 491.395, "r": 163.756, "b": 501.247, "coord_origin": "TOPLEFT"}, "confidence": 0.9561247229576111, "cells": [{"index": 170, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 501.247, "r_x1": 163.756, "r_y1": 501.247, "r_x2": 163.756, "r_y2": 491.395, "r_x3": 50.112, "r_y3": 491.395, "coord_origin": "TOPLEFT"}, "text": "5.5. Qualitative Analysis", "orig": "5.5. Qualitative Analysis", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "5.5. Qualitative Analysis"}, {"label": "text", "id": 1, "page_no": 7, "cluster": {"id": 1, "label": "text", "bbox": {"l": 50.112, "t": 537.142, "r": 286.365, "b": 713.066, "coord_origin": "TOPLEFT"}, "confidence": 0.9852361679077148, "cells": [{"index": 171, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 545.694, "r_x1": 118.505, "r_y1": 545.694, "r_x2": 118.505, "r_y2": 537.142, "r_x3": 62.067, "r_y3": 537.142, "coord_origin": "TOPLEFT"}, "text": "We showcase", "orig": "We showcase", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 172, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 123.985, "r_y0": 545.694, "r_x1": 151.8, "r_y1": 545.694, "r_x2": 151.8, "r_y2": 537.142, "r_x3": 123.985, "r_y3": 537.142, "coord_origin": "TOPLEFT"}, "text": "several", "orig": "several", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 173, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 157.28, "r_y0": 545.694, "r_x1": 212.074, "r_y1": 545.694, "r_x2": 212.074, "r_y2": 537.142, "r_x3": 157.28, "r_y3": 537.142, "coord_origin": "TOPLEFT"}, "text": "visualizations", "orig": "visualizations", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 174, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 217.553, "r_y0": 545.694, "r_x1": 229.17, "r_y1": 545.694, "r_x2": 229.17, "r_y2": 537.142, "r_x3": 217.553, "r_y3": 537.142, "coord_origin": "TOPLEFT"}, "text": "for", "orig": "for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 175, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 234.659, "r_y0": 545.694, "r_x1": 246.833, "r_y1": 545.694, "r_x2": 246.833, "r_y2": 537.142, "r_x3": 234.659, "r_y3": 537.142, "coord_origin": "TOPLEFT"}, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 176, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 252.313, "r_y0": 545.694, "r_x1": 286.365, "r_y1": 545.694, "r_x2": 286.365, "r_y2": 537.142, "r_x3": 252.313, "r_y3": 537.142, "coord_origin": "TOPLEFT"}, "text": "different", "orig": "different", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 177, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 557.649, "r_x1": 211.157, "r_y1": 557.649, "r_x2": 211.157, "r_y2": 549.097, "r_x3": 50.112, "r_y3": 549.097, "coord_origin": "TOPLEFT"}, "text": "components of our network on various", "orig": "components of our network on various", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 178, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 215.1, "r_y0": 557.506, "r_x1": 259.175, "r_y1": 557.506, "r_x2": 259.175, "r_y2": 548.918, "r_x3": 215.1, "r_y3": 548.918, "coord_origin": "TOPLEFT"}, "text": "'complex'", "orig": "'complex'", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 179, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 263.12, "r_y0": 557.649, "r_x1": 286.363, "r_y1": 557.649, "r_x2": 286.363, "r_y2": 549.097, "r_x3": 263.12, "r_y3": 549.097, "coord_origin": "TOPLEFT"}, "text": "tables", "orig": "tables", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 180, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 569.604, "r_x1": 231.72, "r_y1": 569.604, "r_x2": 231.72, "r_y2": 561.052, "r_x3": 50.112, "r_y3": 561.052, "coord_origin": "TOPLEFT"}, "text": "within datasets presented in this work in Fig.", "orig": "within datasets presented in this work in Fig.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 181, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 236.064, "r_y0": 569.604, "r_x1": 277.03, "r_y1": 569.604, "r_x2": 277.03, "r_y2": 561.052, "r_x3": 236.064, "r_y3": 561.052, "coord_origin": "TOPLEFT"}, "text": "5 and Fig.", "orig": "5 and Fig.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 182, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 281.384, "r_y0": 569.604, "r_x1": 286.365, "r_y1": 569.604, "r_x2": 286.365, "r_y2": 561.052, "r_x3": 281.384, "r_y3": 561.052, "coord_origin": "TOPLEFT"}, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 183, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 581.559, "r_x1": 286.365, "r_y1": 581.559, "r_x2": 286.365, "r_y2": 573.0070000000001, "r_x3": 50.112, "r_y3": 573.0070000000001, "coord_origin": "TOPLEFT"}, "text": "As it is shown, our model is able to predict bounding boxes", "orig": "As it is shown, our model is able to predict bounding boxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 184, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 593.514, "r_x1": 122.341, "r_y1": 593.514, "r_x2": 122.341, "r_y2": 584.962, "r_x3": 50.112, "r_y3": 584.962, "coord_origin": "TOPLEFT"}, "text": "for all table cells,", "orig": "for all table cells,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 185, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 126.107, "r_y0": 593.514, "r_x1": 228.004, "r_y1": 593.514, "r_x2": 228.004, "r_y2": 584.962, "r_x3": 126.107, "r_y3": 584.962, "coord_origin": "TOPLEFT"}, "text": "even for the empty ones.", "orig": "even for the empty ones.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 186, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 234.151, "r_y0": 593.514, "r_x1": 286.365, "r_y1": 593.514, "r_x2": 286.365, "r_y2": 584.962, "r_x3": 234.151, "r_y3": 584.962, "coord_origin": "TOPLEFT"}, "text": "Additionally,", "orig": "Additionally,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 187, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 605.47, "r_x1": 286.365, "r_y1": 605.47, "r_x2": 286.365, "r_y2": 596.918, "r_x3": 50.112, "r_y3": 596.918, "coord_origin": "TOPLEFT"}, "text": "our post-processing techniques can extract the cell content", "orig": "our post-processing techniques can extract the cell content", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 188, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 617.425, "r_x1": 286.365, "r_y1": 617.425, "r_x2": 286.365, "r_y2": 608.873, "r_x3": 50.112, "r_y3": 608.873, "coord_origin": "TOPLEFT"}, "text": "by matching the predicted bounding boxes to the PDF cells", "orig": "by matching the predicted bounding boxes to the PDF cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 189, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 629.38, "r_x1": 230.873, "r_y1": 629.38, "r_x2": 230.873, "r_y2": 620.828, "r_x3": 50.112, "r_y3": 620.828, "coord_origin": "TOPLEFT"}, "text": "based on their overlap and spatial proximity.", "orig": "based on their overlap and spatial proximity.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 190, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 235.855, "r_y0": 629.38, "r_x1": 286.365, "r_y1": 629.38, "r_x2": 286.365, "r_y2": 620.828, "r_x3": 235.855, "r_y3": 620.828, "coord_origin": "TOPLEFT"}, "text": "The left part", "orig": "The left part", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 191, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 641.335, "r_x1": 77.121, "r_y1": 641.335, "r_x2": 77.121, "r_y2": 632.783, "r_x3": 50.112, "r_y3": 632.783, "coord_origin": "TOPLEFT"}, "text": "of Fig.", "orig": "of Fig.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 192, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 81.544, "r_y0": 641.335, "r_x1": 286.365, "r_y1": 641.335, "r_x2": 286.365, "r_y2": 632.783, "r_x3": 81.544, "r_y3": 632.783, "coord_origin": "TOPLEFT"}, "text": "5 demonstrates also the adaptability of our method", "orig": "5 demonstrates also the adaptability of our method", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 193, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 653.29, "r_x1": 57.863, "r_y1": 653.29, "r_x2": 57.863, "r_y2": 644.738, "r_x3": 50.112, "r_y3": 644.738, "coord_origin": "TOPLEFT"}, "text": "to", "orig": "to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 194, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.436, "r_y0": 653.29, "r_x1": 119.691, "r_y1": 653.29, "r_x2": 119.691, "r_y2": 644.738, "r_x3": 62.436, "r_y3": 644.738, "coord_origin": "TOPLEFT"}, "text": "any language,", "orig": "any language,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 195, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 124.782, "r_y0": 653.29, "r_x1": 133.081, "r_y1": 653.29, "r_x2": 133.081, "r_y2": 644.738, "r_x3": 124.782, "r_y3": 644.738, "coord_origin": "TOPLEFT"}, "text": "as", "orig": "as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 196, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 137.653, "r_y0": 653.29, "r_x1": 143.193, "r_y1": 653.29, "r_x2": 143.193, "r_y2": 644.738, "r_x3": 137.653, "r_y3": 644.738, "coord_origin": "TOPLEFT"}, "text": "it", "orig": "it", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 197, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 147.765, "r_y0": 653.29, "r_x1": 214.854, "r_y1": 653.29, "r_x2": 214.854, "r_y2": 644.738, "r_x3": 147.765, "r_y3": 644.738, "coord_origin": "TOPLEFT"}, "text": "can successfully", "orig": "can successfully", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 198, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 219.426, "r_y0": 653.29, "r_x1": 246.385, "r_y1": 653.29, "r_x2": 246.385, "r_y2": 644.738, "r_x3": 219.426, "r_y3": 644.738, "coord_origin": "TOPLEFT"}, "text": "extract", "orig": "extract", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 199, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 250.958, "r_y0": 653.29, "r_x1": 286.365, "r_y1": 653.29, "r_x2": 286.365, "r_y2": 644.738, "r_x3": 250.958, "r_y3": 644.738, "coord_origin": "TOPLEFT"}, "text": "Japanese", "orig": "Japanese", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 200, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 665.245, "r_x1": 286.365, "r_y1": 665.245, "r_x2": 286.365, "r_y2": 656.693, "r_x3": 50.112, "r_y3": 656.693, "coord_origin": "TOPLEFT"}, "text": "text, although the training set contains only English content.", "orig": "text, although the training set contains only English content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 201, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 677.201, "r_x1": 286.365, "r_y1": 677.201, "r_x2": 286.365, "r_y2": 668.649, "r_x3": 50.112, "r_y3": 668.649, "coord_origin": "TOPLEFT"}, "text": "We provide more visualizations including the intermediate", "orig": "We provide more visualizations including the intermediate", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 202, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 689.156, "r_x1": 195.217, "r_y1": 689.156, "r_x2": 195.217, "r_y2": 680.604, "r_x3": 50.112, "r_y3": 680.604, "coord_origin": "TOPLEFT"}, "text": "steps in the supplementary material.", "orig": "steps in the supplementary material.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 203, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 199.431, "r_y0": 689.156, "r_x1": 286.365, "r_y1": 689.156, "r_x2": 286.365, "r_y2": 680.604, "r_x3": 199.431, "r_y3": 680.604, "coord_origin": "TOPLEFT"}, "text": "Overall these illustra-", "orig": "Overall these illustra-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 204, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 701.111, "r_x1": 286.365, "r_y1": 701.111, "r_x2": 286.365, "r_y2": 692.559, "r_x3": 50.112, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "tions justify the versatility of our method across a diverse", "orig": "tions justify the versatility of our method across a diverse", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 205, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 713.066, "r_x1": 226.888, "r_y1": 713.066, "r_x2": 226.888, "r_y2": 704.514, "r_x3": 50.112, "r_y3": 704.514, "coord_origin": "TOPLEFT"}, "text": "range of table appearances and content type.", "orig": "range of table appearances and content type.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "We showcase several visualizations for the different components of our network on various 'complex' tables within datasets presented in this work in Fig. 5 and Fig. 6 As it is shown, our model is able to predict bounding boxes for all table cells, even for the empty ones. Additionally, our post-processing techniques can extract the cell content by matching the predicted bounding boxes to the PDF cells based on their overlap and spatial proximity. The left part of Fig. 5 demonstrates also the adaptability of our method to any language, as it can successfully extract Japanese text, although the training set contains only English content. We provide more visualizations including the intermediate steps in the supplementary material. Overall these illustrations justify the versatility of our method across a diverse range of table appearances and content type."}, {"label": "section_header", "id": 4, "page_no": 7, "cluster": {"id": 4, "label": "section_header", "bbox": {"l": 308.862, "t": 490.709, "r": 460.848, "b": 501.457, "coord_origin": "TOPLEFT"}, "confidence": 0.9436525702476501, "cells": [{"index": 206, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 501.457, "r_x1": 460.848, "r_y1": 501.457, "r_x2": 460.848, "r_y2": 490.709, "r_x3": 308.862, "r_y3": 490.709, "coord_origin": "TOPLEFT"}, "text": "6. Future Work &Conclusion", "orig": "6. Future Work &Conclusion", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "6. Future Work &Conclusion"}, {"label": "text", "id": 0, "page_no": 7, "cluster": {"id": 0, "label": "text", "bbox": {"l": 308.862, "t": 513.162, "r": 545.115, "b": 653.22, "coord_origin": "TOPLEFT"}, "confidence": 0.9875594973564148, "cells": [{"index": 207, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 521.7139999999999, "r_x1": 545.115, "r_y1": 521.7139999999999, "r_x2": 545.115, "r_y2": 513.162, "r_x3": 320.817, "r_y3": 513.162, "coord_origin": "TOPLEFT"}, "text": "In this paper, we presented TableFormer an end-to-end", "orig": "In this paper, we presented TableFormer an end-to-end", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 208, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 533.669, "r_x1": 545.115, "r_y1": 533.669, "r_x2": 545.115, "r_y2": 525.117, "r_x3": 308.862, "r_y3": 525.117, "coord_origin": "TOPLEFT"}, "text": "transformer based approach to predict table structures and", "orig": "transformer based approach to predict table structures and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 209, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 545.624, "r_x1": 545.115, "r_y1": 545.624, "r_x2": 545.115, "r_y2": 537.072, "r_x3": 308.862, "r_y3": 537.072, "coord_origin": "TOPLEFT"}, "text": "bounding boxes of cells from an image. This approach en-", "orig": "bounding boxes of cells from an image. This approach en-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 210, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 557.579, "r_x1": 545.115, "r_y1": 557.579, "r_x2": 545.115, "r_y2": 549.027, "r_x3": 308.862, "r_y3": 549.027, "coord_origin": "TOPLEFT"}, "text": "ables us to recreate the table structure, and extract the cell", "orig": "ables us to recreate the table structure, and extract the cell", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 211, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 569.534, "r_x1": 524.562, "r_y1": 569.534, "r_x2": 524.562, "r_y2": 560.982, "r_x3": 308.862, "r_y3": 560.982, "coord_origin": "TOPLEFT"}, "text": "content from PDF or OCR by using bounding boxes.", "orig": "content from PDF or OCR by using bounding boxes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 212, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 529.623, "r_y0": 569.534, "r_x1": 545.115, "r_y1": 569.534, "r_x2": 545.115, "r_y2": 560.982, "r_x3": 529.623, "r_y3": 560.982, "coord_origin": "TOPLEFT"}, "text": "Ad-", "orig": "Ad-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 213, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 581.489, "r_x1": 545.115, "r_y1": 581.489, "r_x2": 545.115, "r_y2": 572.937, "r_x3": 308.862, "r_y3": 572.937, "coord_origin": "TOPLEFT"}, "text": "ditionally, it provides the versatility required in real-world", "orig": "ditionally, it provides the versatility required in real-world", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 214, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 593.4449999999999, "r_x1": 545.115, "r_y1": 593.4449999999999, "r_x2": 545.115, "r_y2": 584.893, "r_x3": 308.862, "r_y3": 584.893, "coord_origin": "TOPLEFT"}, "text": "scenarios when dealing with various types of PDF docu-", "orig": "scenarios when dealing with various types of PDF docu-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 215, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 605.4, "r_x1": 335.153, "r_y1": 605.4, "r_x2": 335.153, "r_y2": 596.848, "r_x3": 308.862, "r_y3": 596.848, "coord_origin": "TOPLEFT"}, "text": "ments,", "orig": "ments,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 216, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 339.656, "r_y0": 605.4, "r_x1": 400.468, "r_y1": 605.4, "r_x2": 400.468, "r_y2": 596.848, "r_x3": 339.656, "r_y3": 596.848, "coord_origin": "TOPLEFT"}, "text": "and languages.", "orig": "and languages.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 217, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 408.378, "r_y0": 605.4, "r_x1": 460.672, "r_y1": 605.4, "r_x2": 460.672, "r_y2": 596.848, "r_x3": 408.378, "r_y3": 596.848, "coord_origin": "TOPLEFT"}, "text": "Furthermore,", "orig": "Furthermore,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 218, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 465.175, "r_y0": 605.4, "r_x1": 545.115, "r_y1": 605.4, "r_x2": 545.115, "r_y2": 596.848, "r_x3": 465.175, "r_y3": 596.848, "coord_origin": "TOPLEFT"}, "text": "our method outper-", "orig": "our method outper-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 219, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 617.355, "r_x1": 495.471, "r_y1": 617.355, "r_x2": 495.471, "r_y2": 608.803, "r_x3": 308.862, "r_y3": 608.803, "coord_origin": "TOPLEFT"}, "text": "forms all state-of-the-arts with a wide margin.", "orig": "forms all state-of-the-arts with a wide margin.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 220, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 500.234, "r_y0": 617.355, "r_x1": 545.115, "r_y1": 617.355, "r_x2": 545.115, "r_y2": 608.803, "r_x3": 500.234, "r_y3": 608.803, "coord_origin": "TOPLEFT"}, "text": "Finally, we", "orig": "Finally, we", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 221, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 629.31, "r_x1": 545.115, "r_y1": 629.31, "r_x2": 545.115, "r_y2": 620.758, "r_x3": 308.862, "r_y3": 620.758, "coord_origin": "TOPLEFT"}, "text": "introduce 'SynthTabNet' a challenging synthetically gen-", "orig": "introduce 'SynthTabNet' a challenging synthetically gen-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 222, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 641.265, "r_x1": 545.115, "r_y1": 641.265, "r_x2": 545.115, "r_y2": 632.713, "r_x3": 308.862, "r_y3": 632.713, "coord_origin": "TOPLEFT"}, "text": "erated dataset that reinforces missing characteristics from", "orig": "erated dataset that reinforces missing characteristics from", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 223, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 653.22, "r_x1": 365.858, "r_y1": 653.22, "r_x2": 365.858, "r_y2": 644.668, "r_x3": 308.862, "r_y3": 644.668, "coord_origin": "TOPLEFT"}, "text": "other datasets.", "orig": "other datasets.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "In this paper, we presented TableFormer an end-to-end transformer based approach to predict table structures and bounding boxes of cells from an image. This approach enables us to recreate the table structure, and extract the cell content from PDF or OCR by using bounding boxes. Additionally, it provides the versatility required in real-world scenarios when dealing with various types of PDF documents, and languages. Furthermore, our method outperforms all state-of-the-arts with a wide margin. Finally, we introduce 'SynthTabNet' a challenging synthetically generated dataset that reinforces missing characteristics from other datasets."}, {"label": "section_header", "id": 3, "page_no": 7, "cluster": {"id": 3, "label": "section_header", "bbox": {"l": 308.862, "t": 672.099, "r": 364.406, "b": 682.847, "coord_origin": "TOPLEFT"}, "confidence": 0.9442470073699951, "cells": [{"index": 224, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 682.847, "r_x1": 364.406, "r_y1": 682.847, "r_x2": 364.406, "r_y2": 672.099, "r_x3": 308.862, "r_y3": 672.099, "coord_origin": "TOPLEFT"}, "text": "References", "orig": "References", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "References"}, {"label": "list_item", "id": 10, "page_no": 7, "cluster": {"id": 10, "label": "list_item", "bbox": {"l": 313.345, "t": 694.204, "r": 545.113, "b": 712.86, "coord_origin": "TOPLEFT"}, "confidence": 0.8318753838539124, "cells": [{"index": 225, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 313.345, "r_y0": 701.901, "r_x1": 323.8, "r_y1": 701.901, "r_x2": 323.8, "r_y2": 694.204, "r_x3": 313.345, "r_y3": 694.204, "coord_origin": "TOPLEFT"}, "text": "[1]", "orig": "[1]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 226, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.785, "r_y0": 701.901, "r_x1": 545.109, "r_y1": 701.901, "r_x2": 545.109, "r_y2": 694.204, "r_x3": 328.785, "r_y3": 694.204, "coord_origin": "TOPLEFT"}, "text": "Nicolas Carion, Francisco Massa, Gabriel Synnaeve, Nicolas", "orig": "Nicolas Carion, Francisco Massa, Gabriel Synnaeve, Nicolas", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 227, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 712.86, "r_x1": 545.113, "r_y1": 712.86, "r_x2": 545.113, "r_y2": 705.163, "r_x3": 328.781, "r_y3": 705.163, "coord_origin": "TOPLEFT"}, "text": "Usunier, Alexander Kirillov, and Sergey Zagoruyko. End-to-", "orig": "Usunier, Alexander Kirillov, and Sergey Zagoruyko. End-to-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[1] Nicolas Carion, Francisco Massa, Gabriel Synnaeve, Nicolas Usunier, Alexander Kirillov, and Sergey Zagoruyko. End-to-"}, {"label": "page_footer", "id": 9, "page_no": 7, "cluster": {"id": 9, "label": "page_footer", "bbox": {"l": 295.121, "t": 734.402, "r": 300.102, "b": 742.954, "coord_origin": "TOPLEFT"}, "confidence": 0.8709858059883118, "cells": [{"index": 228, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 295.121, "r_y0": 742.954, "r_x1": 300.102, "r_y1": 742.954, "r_x2": 300.102, "r_y2": 734.402, "r_x3": 295.121, "r_y3": 734.402, "coord_origin": "TOPLEFT"}, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "8"}, {"label": "picture", "id": 15, "page_no": 7, "cluster": {"id": 15, "label": "picture", "bbox": {"l": 305.5836486816406, "t": 98.65415954589844, "r": 554.8258666992188, "b": 180.6267547607422, "coord_origin": "TOPLEFT"}, "confidence": 0.7699173092842102, "cells": [], "children": []}, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null}, {"label": "picture", "id": 14, "page_no": 7, "cluster": {"id": 14, "label": "picture", "bbox": {"l": 49.97503662109375, "t": 103.71266174316406, "r": 301.6335754394531, "b": 187.5789337158203, "coord_origin": "TOPLEFT"}, "confidence": 0.7873926162719727, "cells": [], "children": []}, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null}], "body": [{"label": "caption", "id": 18, "page_no": 7, "cluster": {"id": 18, "label": "caption", "bbox": {"l": 53.812, "t": 208.54100000000005, "r": 385.934, "b": 216.02300000000002, "coord_origin": "TOPLEFT"}, "confidence": 0.5986505746841431, "cells": [{"index": 0, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 53.812, "r_y0": 216.02300000000002, "r_x1": 385.934, "r_y1": 216.02300000000002, "r_x2": 385.934, "r_y2": 208.54100000000005, "r_x3": 53.812, "r_y3": 208.54100000000005, "coord_origin": "TOPLEFT"}, "text": "b. Structure predicted by TableFormer, with superimposed matched PDF cell text:", "orig": "b. Structure predicted by TableFormer, with superimposed matched PDF cell text:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "b. Structure predicted by TableFormer, with superimposed matched PDF cell text:"}, {"label": "section_header", "id": 29, "page_no": 7, "cluster": {"id": 29, "label": "section_header", "bbox": {"l": 53.812, "t": 94.58900000000006, "r": 284.346, "b": 102.07100000000003, "coord_origin": "TOPLEFT"}, "confidence": 0.46452972292900085, "cells": [{"index": 1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 53.812, "r_y0": 102.07100000000003, "r_x1": 284.346, "r_y1": 102.07100000000003, "r_x2": 284.346, "r_y2": 94.58900000000006, "r_x3": 53.812, "r_y3": 94.58900000000006, "coord_origin": "TOPLEFT"}, "text": "Japanese language (previously unseen by TableFormer):", "orig": "Japanese language (previously unseen by TableFormer):", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Japanese language (previously unseen by TableFormer):"}, {"label": "section_header", "id": 31, "page_no": 7, "cluster": {"id": 31, "label": "section_header", "bbox": {"l": 304.831, "t": 94.58900000000006, "r": 431.091, "b": 102.07100000000003, "coord_origin": "TOPLEFT"}, "confidence": 0.4629225730895996, "cells": [{"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 304.831, "r_y0": 102.07100000000003, "r_x1": 431.091, "r_y1": 102.07100000000003, "r_x2": 431.091, "r_y2": 94.58900000000006, "r_x3": 304.831, "r_y3": 94.58900000000006, "coord_origin": "TOPLEFT"}, "text": "Example table from FinTabNet:", "orig": "Example table from FinTabNet:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Example table from FinTabNet:"}, {"label": "list_item", "id": 21, "page_no": 7, "cluster": {"id": 21, "label": "list_item", "bbox": {"l": 53.286, "t": 78.995, "r": 499.556, "b": 86.47699999999998, "coord_origin": "TOPLEFT"}, "confidence": 0.541211724281311, "cells": [{"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 53.286, "r_y0": 86.47699999999998, "r_x1": 499.556, "r_y1": 86.47699999999998, "r_x2": 499.556, "r_y2": 78.995, "r_x3": 53.286, "r_y3": 78.995, "coord_origin": "TOPLEFT"}, "text": "a. Red - PDF cells, Green - predicted bounding boxes, Blue - post-processed predictions matched to PDF cells", "orig": "a. Red - PDF cells, Green - predicted bounding boxes, Blue - post-processed predictions matched to PDF cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "a. Red - PDF cells, Green - predicted bounding boxes, Blue - post-processed predictions matched to PDF cells"}, {"label": "table", "id": 8, "page_no": 7, "cluster": {"id": 8, "label": "table", "bbox": {"l": 53.62853240966797, "t": 218.94857788085938, "r": 298.5574951171875, "b": 292.39996337890625, "coord_origin": "TOPLEFT"}, "confidence": 0.8824009299278259, "cells": [{"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 209.933, "r_y0": 226.00400000000002, "r_x1": 223.873, "r_y1": 226.00400000000002, "r_x2": 223.873, "r_y2": 221.35799999999995, "r_x3": 209.933, "r_y3": 221.35799999999995, "coord_origin": "TOPLEFT"}, "text": "\u8ad6\u6587\u30d5\u30a1\u30a4\u30eb", "orig": "\u8ad6\u6587\u30d5\u30a1\u30a4\u30eb", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 263.765, "r_y0": 226.00400000000002, "r_x1": 273.058, "r_y1": 226.00400000000002, "r_x2": 273.058, "r_y2": 221.35799999999995, "r_x3": 263.765, "r_y3": 221.35799999999995, "coord_origin": "TOPLEFT"}, "text": "\u53c2\u8003\u6587\u732e", "orig": "\u53c2\u8003\u6587\u732e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 110.25, "r_y0": 233.49, "r_x1": 114.896, "r_y1": 233.49, "r_x2": 114.896, "r_y2": 228.84400000000005, "r_x3": 110.25, "r_y3": 228.84400000000005, "coord_origin": "TOPLEFT"}, "text": "\u51fa\u5178", "orig": "\u51fa\u5178", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 175.366, "r_y0": 233.49, "r_x1": 186.983, "r_y1": 233.49, "r_x2": 186.983, "r_y2": 228.84400000000005, "r_x3": 175.366, "r_y3": 228.84400000000005, "coord_origin": "TOPLEFT"}, "text": "\u30d5\u30a1\u30a4\u30eb\u6570", "orig": "\u30d5\u30a1\u30a4\u30eb\u6570", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 195.314, "r_y0": 233.49, "r_x1": 199.961, "r_y1": 233.49, "r_x2": 199.961, "r_y2": 228.84400000000005, "r_x3": 195.314, "r_y3": 228.84400000000005, "coord_origin": "TOPLEFT"}, "text": "\u82f1\u8a9e", "orig": "\u82f1\u8a9e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 229.198, "r_y0": 233.49, "r_x1": 236.168, "r_y1": 233.49, "r_x2": 236.168, "r_y2": 228.84400000000005, "r_x3": 229.198, "r_y3": 228.84400000000005, "coord_origin": "TOPLEFT"}, "text": "\u65e5\u672c\u8a9e", "orig": "\u65e5\u672c\u8a9e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 256.114, "r_y0": 233.49, "r_x1": 260.761, "r_y1": 233.49, "r_x2": 260.761, "r_y2": 228.84400000000005, "r_x3": 256.114, "r_y3": 228.84400000000005, "coord_origin": "TOPLEFT"}, "text": "\u82f1\u8a9e", "orig": "\u82f1\u8a9e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 278.384, "r_y0": 233.49, "r_x1": 285.354, "r_y1": 233.49, "r_x2": 285.354, "r_y2": 228.84400000000005, "r_x3": 278.384, "r_y3": 228.84400000000005, "coord_origin": "TOPLEFT"}, "text": "\u65e5\u672c\u8a9e", "orig": "\u65e5\u672c\u8a9e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 55.531, "r_y0": 240.76800000000003, "r_x1": 162.713, "r_y1": 240.76800000000003, "r_x2": 162.713, "r_y2": 236.48199999999997, "r_x3": 55.531, "r_y3": 236.48199999999997, "coord_origin": "TOPLEFT"}, "text": "Association for Computational Linguistics(ACL2003)", "orig": "Association for Computational Linguistics(ACL2003)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 184.397, "r_y0": 240.76800000000003, "r_x1": 189.565, "r_y1": 240.76800000000003, "r_x2": 189.565, "r_y2": 236.48199999999997, "r_x3": 184.397, "r_y3": 236.48199999999997, "coord_origin": "TOPLEFT"}, "text": "65", "orig": "65", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 208.99, "r_y0": 240.76800000000003, "r_x1": 214.158, "r_y1": 240.76800000000003, "r_x2": 214.158, "r_y2": 236.48199999999997, "r_x3": 208.99, "r_y3": 236.48199999999997, "coord_origin": "TOPLEFT"}, "text": "65", "orig": "65", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 234.875, "r_y0": 240.76800000000003, "r_x1": 237.458, "r_y1": 240.76800000000003, "r_x2": 237.458, "r_y2": 236.48199999999997, "r_x3": 234.875, "r_y3": 236.48199999999997, "coord_origin": "TOPLEFT"}, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 256.884, "r_y0": 240.76800000000003, "r_x1": 264.636, "r_y1": 240.76800000000003, "r_x2": 264.636, "r_y2": 236.48199999999997, "r_x3": 256.884, "r_y3": 236.48199999999997, "coord_origin": "TOPLEFT"}, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 284.061, "r_y0": 240.76800000000003, "r_x1": 286.644, "r_y1": 240.76800000000003, "r_x2": 286.644, "r_y2": 236.48199999999997, "r_x3": 284.061, "r_y3": 236.48199999999997, "coord_origin": "TOPLEFT"}, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 55.531, "r_y0": 246.962, "r_x1": 139.722, "r_y1": 246.962, "r_x2": 139.722, "r_y2": 242.67600000000004, "r_x3": 55.531, "r_y3": 242.67600000000004, "coord_origin": "TOPLEFT"}, "text": "Computational Linguistics(COLING2002)", "orig": "Computational Linguistics(COLING2002)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 19, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.105, "r_y0": 246.962, "r_x1": 190.857, "r_y1": 246.962, "r_x2": 190.857, "r_y2": 242.67600000000004, "r_x3": 183.105, "r_y3": 242.67600000000004, "coord_origin": "TOPLEFT"}, "text": "140", "orig": "140", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 20, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 207.698, "r_y0": 246.962, "r_x1": 215.45, "r_y1": 246.962, "r_x2": 215.45, "r_y2": 242.67600000000004, "r_x3": 207.698, "r_y3": 242.67600000000004, "coord_origin": "TOPLEFT"}, "text": "140", "orig": "140", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 21, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 234.875, "r_y0": 246.962, "r_x1": 237.458, "r_y1": 246.962, "r_x2": 237.458, "r_y2": 242.67600000000004, "r_x3": 234.875, "r_y3": 242.67600000000004, "coord_origin": "TOPLEFT"}, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 22, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 256.884, "r_y0": 246.962, "r_x1": 264.636, "r_y1": 246.962, "r_x2": 264.636, "r_y2": 242.67600000000004, "r_x3": 256.884, "r_y3": 242.67600000000004, "coord_origin": "TOPLEFT"}, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 23, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 284.061, "r_y0": 246.962, "r_x1": 286.644, "r_y1": 246.962, "r_x2": 286.644, "r_y2": 242.67600000000004, "r_x3": 284.061, "r_y3": 242.67600000000004, "coord_origin": "TOPLEFT"}, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 24, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 55.531, "r_y0": 253.62199999999996, "r_x1": 74.118, "r_y1": 253.62199999999996, "r_x2": 74.118, "r_y2": 248.976, "r_x3": 55.531, "r_y3": 248.976, "coord_origin": "TOPLEFT"}, "text": "\u96fb\u6c17\u60c5\u5831\u901a\u4fe1\u5b66\u4f1a", "orig": "\u96fb\u6c17\u60c5\u5831\u901a\u4fe1\u5b66\u4f1a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 25, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 92.698, "r_y0": 253.93100000000004, "r_x1": 103.034, "r_y1": 253.93100000000004, "r_x2": 103.034, "r_y2": 249.64499999999998, "r_x3": 92.698, "r_y3": 249.64499999999998, "coord_origin": "TOPLEFT"}, "text": "2003", "orig": "2003", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 26, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 103.034, "r_y0": 253.62199999999996, "r_x1": 114.651, "r_y1": 253.62199999999996, "r_x2": 114.651, "r_y2": 248.976, "r_x3": 103.034, "r_y3": 248.976, "coord_origin": "TOPLEFT"}, "text": "\u5e74\u7dcf\u5408\u5927\u4f1a", "orig": "\u5e74\u7dcf\u5408\u5927\u4f1a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 27, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.105, "r_y0": 253.15700000000004, "r_x1": 190.857, "r_y1": 253.15700000000004, "r_x2": 190.857, "r_y2": 248.87099999999998, "r_x3": 183.105, "r_y3": 248.87099999999998, "coord_origin": "TOPLEFT"}, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 28, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 210.282, "r_y0": 253.15700000000004, "r_x1": 212.865, "r_y1": 253.15700000000004, "r_x2": 212.865, "r_y2": 248.87099999999998, "r_x3": 210.282, "r_y3": 248.87099999999998, "coord_origin": "TOPLEFT"}, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 29, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 232.292, "r_y0": 253.15700000000004, "r_x1": 240.043, "r_y1": 253.15700000000004, "r_x2": 240.043, "r_y2": 248.87099999999998, "r_x3": 232.292, "r_y3": 248.87099999999998, "coord_origin": "TOPLEFT"}, "text": "142", "orig": "142", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 30, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 256.884, "r_y0": 253.15700000000004, "r_x1": 264.636, "r_y1": 253.15700000000004, "r_x2": 264.636, "r_y2": 248.87099999999998, "r_x3": 256.884, "r_y3": 248.87099999999998, "coord_origin": "TOPLEFT"}, "text": "223", "orig": "223", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 281.477, "r_y0": 253.15700000000004, "r_x1": 289.229, "r_y1": 253.15700000000004, "r_x2": 289.229, "r_y2": 248.87099999999998, "r_x3": 281.477, "r_y3": 248.87099999999998, "coord_origin": "TOPLEFT"}, "text": "147", "orig": "147", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 55.531, "r_y0": 261.10699999999997, "r_x1": 71.794, "r_y1": 261.10699999999997, "r_x2": 71.794, "r_y2": 256.461, "r_x3": 55.531, "r_y3": 256.461, "coord_origin": "TOPLEFT"}, "text": "\u60c5\u5831\u51e6\u7406\u5b66\u4f1a\u7b2c", "orig": "\u60c5\u5831\u51e6\u7406\u5b66\u4f1a\u7b2c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 88.053, "r_y0": 261.41600000000005, "r_x1": 93.22, "r_y1": 261.41600000000005, "r_x2": 93.22, "r_y2": 257.13, "r_x3": 88.053, "r_y3": 257.13, "coord_origin": "TOPLEFT"}, "text": "65", "orig": "65", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 93.22, "r_y0": 261.10699999999997, "r_x1": 104.837, "r_y1": 261.10699999999997, "r_x2": 104.837, "r_y2": 256.461, "r_x3": 93.22, "r_y3": 256.461, "coord_origin": "TOPLEFT"}, "text": "\u56de\u5168\u56fd\u5927\u4f1a", "orig": "\u56de\u5168\u56fd\u5927\u4f1a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 116.451, "r_y0": 261.41600000000005, "r_x1": 129.882, "r_y1": 261.41600000000005, "r_x2": 129.882, "r_y2": 257.13, "r_x3": 116.451, "r_y3": 257.13, "coord_origin": "TOPLEFT"}, "text": "(2003)", "orig": "(2003)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.105, "r_y0": 260.64200000000005, "r_x1": 190.857, "r_y1": 260.64200000000005, "r_x2": 190.857, "r_y2": 256.356, "r_x3": 183.105, "r_y3": 256.356, "coord_origin": "TOPLEFT"}, "text": "177", "orig": "177", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 210.282, "r_y0": 260.64200000000005, "r_x1": 212.865, "r_y1": 260.64200000000005, "r_x2": 212.865, "r_y2": 256.356, "r_x3": 210.282, "r_y3": 256.356, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 232.292, "r_y0": 260.64200000000005, "r_x1": 240.043, "r_y1": 260.64200000000005, "r_x2": 240.043, "r_y2": 256.356, "r_x3": 232.292, "r_y3": 256.356, "coord_origin": "TOPLEFT"}, "text": "176", "orig": "176", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 256.884, "r_y0": 260.64200000000005, "r_x1": 264.636, "r_y1": 260.64200000000005, "r_x2": 264.636, "r_y2": 256.356, "r_x3": 256.884, "r_y3": 256.356, "coord_origin": "TOPLEFT"}, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 281.477, "r_y0": 260.64200000000005, "r_x1": 289.229, "r_y1": 260.64200000000005, "r_x2": 289.229, "r_y2": 256.356, "r_x3": 281.477, "r_y3": 256.356, "coord_origin": "TOPLEFT"}, "text": "236", "orig": "236", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 55.531, "r_y0": 268.33399999999995, "r_x1": 57.854, "r_y1": 268.33399999999995, "r_x2": 57.854, "r_y2": 263.688, "r_x3": 55.531, "r_y3": 263.688, "coord_origin": "TOPLEFT"}, "text": "\u7b2c", "orig": "\u7b2c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 60.177, "r_y0": 268.644, "r_x1": 65.344, "r_y1": 268.644, "r_x2": 65.344, "r_y2": 264.35699999999997, "r_x3": 60.177, "r_y3": 264.35699999999997, "coord_origin": "TOPLEFT"}, "text": "17", "orig": "17", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 65.344, "r_y0": 268.33399999999995, "r_x1": 90.902, "r_y1": 268.33399999999995, "r_x2": 90.902, "r_y2": 263.688, "r_x3": 65.344, "r_y3": 263.688, "coord_origin": "TOPLEFT"}, "text": "\u56de\u4eba\u5de5\u77e5\u80fd\u5b66\u4f1a\u5168\u56fd\u5927\u4f1a", "orig": "\u56de\u4eba\u5de5\u77e5\u80fd\u5b66\u4f1a\u5168\u56fd\u5927\u4f1a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 116.451, "r_y0": 268.644, "r_x1": 129.882, "r_y1": 268.644, "r_x2": 129.882, "r_y2": 264.35699999999997, "r_x3": 116.451, "r_y3": 264.35699999999997, "coord_origin": "TOPLEFT"}, "text": "(2003)", "orig": "(2003)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.105, "r_y0": 267.869, "r_x1": 190.857, "r_y1": 267.869, "r_x2": 190.857, "r_y2": 263.58299999999997, "r_x3": 183.105, "r_y3": 263.58299999999997, "coord_origin": "TOPLEFT"}, "text": "208", "orig": "208", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 210.282, "r_y0": 267.869, "r_x1": 212.865, "r_y1": 267.869, "r_x2": 212.865, "r_y2": 263.58299999999997, "r_x3": 210.282, "r_y3": 263.58299999999997, "coord_origin": "TOPLEFT"}, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 232.292, "r_y0": 267.869, "r_x1": 240.043, "r_y1": 267.869, "r_x2": 240.043, "r_y2": 263.58299999999997, "r_x3": 232.292, "r_y3": 263.58299999999997, "coord_origin": "TOPLEFT"}, "text": "203", "orig": "203", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 48, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 256.884, "r_y0": 267.869, "r_x1": 264.636, "r_y1": 267.869, "r_x2": 264.636, "r_y2": 263.58299999999997, "r_x3": 256.884, "r_y3": 263.58299999999997, "coord_origin": "TOPLEFT"}, "text": "152", "orig": "152", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 49, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 281.477, "r_y0": 267.869, "r_x1": 289.229, "r_y1": 267.869, "r_x2": 289.229, "r_y2": 263.58299999999997, "r_x3": 281.477, "r_y3": 263.58299999999997, "coord_origin": "TOPLEFT"}, "text": "244", "orig": "244", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 50, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 55.531, "r_y0": 275.562, "r_x1": 78.765, "r_y1": 275.562, "r_x2": 78.765, "r_y2": 270.91600000000005, "r_x3": 55.531, "r_y3": 270.91600000000005, "coord_origin": "TOPLEFT"}, "text": "\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u7814\u7a76\u4f1a\u7b2c", "orig": "\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u7814\u7a76\u4f1a\u7b2c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 51, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 101.99, "r_y0": 275.871, "r_x1": 109.742, "r_y1": 275.871, "r_x2": 109.742, "r_y2": 271.58500000000004, "r_x3": 101.99, "r_y3": 271.58500000000004, "coord_origin": "TOPLEFT"}, "text": "146", "orig": "146", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 52, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 109.742, "r_y0": 275.562, "r_x1": 112.065, "r_y1": 275.562, "r_x2": 112.065, "r_y2": 270.91600000000005, "r_x3": 109.742, "r_y3": 270.91600000000005, "coord_origin": "TOPLEFT"}, "text": "\u301c", "orig": "\u301c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 53, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 114.388, "r_y0": 275.871, "r_x1": 122.139, "r_y1": 275.871, "r_x2": 122.139, "r_y2": 271.58500000000004, "r_x3": 114.388, "r_y3": 271.58500000000004, "coord_origin": "TOPLEFT"}, "text": "155", "orig": "155", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 54, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 122.14, "r_y0": 275.562, "r_x1": 124.463, "r_y1": 275.562, "r_x2": 124.463, "r_y2": 270.91600000000005, "r_x3": 122.14, "r_y3": 270.91600000000005, "coord_origin": "TOPLEFT"}, "text": "\u56de", "orig": "\u56de", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 55, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 184.397, "r_y0": 275.096, "r_x1": 189.565, "r_y1": 275.096, "r_x2": 189.565, "r_y2": 270.80999999999995, "r_x3": 184.397, "r_y3": 270.80999999999995, "coord_origin": "TOPLEFT"}, "text": "98", "orig": "98", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 56, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 210.282, "r_y0": 275.096, "r_x1": 212.865, "r_y1": 275.096, "r_x2": 212.865, "r_y2": 270.80999999999995, "r_x3": 210.282, "r_y3": 270.80999999999995, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 57, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 233.583, "r_y0": 275.096, "r_x1": 238.751, "r_y1": 275.096, "r_x2": 238.751, "r_y2": 270.80999999999995, "r_x3": 233.583, "r_y3": 270.80999999999995, "coord_origin": "TOPLEFT"}, "text": "96", "orig": "96", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 58, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 256.884, "r_y0": 275.096, "r_x1": 264.636, "r_y1": 275.096, "r_x2": 264.636, "r_y2": 270.80999999999995, "r_x3": 256.884, "r_y3": 270.80999999999995, "coord_origin": "TOPLEFT"}, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 59, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 281.477, "r_y0": 275.096, "r_x1": 289.229, "r_y1": 275.096, "r_x2": 289.229, "r_y2": 270.80999999999995, "r_x3": 281.477, "r_y3": 270.80999999999995, "coord_origin": "TOPLEFT"}, "text": "232", "orig": "232", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 60, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 55.531, "r_y0": 283.356, "r_x1": 68.686, "r_y1": 283.356, "r_x2": 68.686, "r_y2": 279.07000000000005, "r_x3": 55.531, "r_y3": 279.07000000000005, "coord_origin": "TOPLEFT"}, "text": "WWW", "orig": "WWW", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 61, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 68.686, "r_y0": 283.047, "r_x1": 87.273, "r_y1": 283.047, "r_x2": 87.273, "r_y2": 278.40099999999995, "r_x3": 68.686, "r_y3": 278.40099999999995, "coord_origin": "TOPLEFT"}, "text": "\u304b\u3089\u53ce\u96c6\u3057\u305f\u8ad6\u6587", "orig": "\u304b\u3089\u53ce\u96c6\u3057\u305f\u8ad6\u6587", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 62, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.105, "r_y0": 282.323, "r_x1": 190.857, "r_y1": 282.323, "r_x2": 190.857, "r_y2": 278.03700000000003, "r_x3": 183.105, "r_y3": 278.03700000000003, "coord_origin": "TOPLEFT"}, "text": "107", "orig": "107", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 63, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 208.99, "r_y0": 282.323, "r_x1": 214.158, "r_y1": 282.323, "r_x2": 214.158, "r_y2": 278.03700000000003, "r_x3": 208.99, "r_y3": 278.03700000000003, "coord_origin": "TOPLEFT"}, "text": "73", "orig": "73", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 64, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 233.583, "r_y0": 282.323, "r_x1": 238.751, "r_y1": 282.323, "r_x2": 238.751, "r_y2": 278.03700000000003, "r_x3": 233.583, "r_y3": 278.03700000000003, "coord_origin": "TOPLEFT"}, "text": "34", "orig": "34", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 65, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 256.884, "r_y0": 282.323, "r_x1": 264.636, "r_y1": 282.323, "r_x2": 264.636, "r_y2": 278.03700000000003, "r_x3": 256.884, "r_y3": 278.03700000000003, "coord_origin": "TOPLEFT"}, "text": "147", "orig": "147", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 66, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 282.769, "r_y0": 282.323, "r_x1": 287.937, "r_y1": 282.323, "r_x2": 287.937, "r_y2": 278.03700000000003, "r_x3": 282.769, "r_y3": 278.03700000000003, "coord_origin": "TOPLEFT"}, "text": "96", "orig": "96", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 67, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 169.615, "r_y0": 290.274, "r_x1": 171.938, "r_y1": 290.274, "r_x2": 171.938, "r_y2": 285.628, "r_x3": 169.615, "r_y3": 285.628, "coord_origin": "TOPLEFT"}, "text": "\u8a08", "orig": "\u8a08", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 68, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.105, "r_y0": 289.809, "r_x1": 190.857, "r_y1": 289.809, "r_x2": 190.857, "r_y2": 285.522, "r_x3": 183.105, "r_y3": 285.522, "coord_origin": "TOPLEFT"}, "text": "945", "orig": "945", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 69, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 207.698, "r_y0": 289.809, "r_x1": 215.45, "r_y1": 289.809, "r_x2": 215.45, "r_y2": 285.522, "r_x3": 207.698, "r_y3": 285.522, "coord_origin": "TOPLEFT"}, "text": "294", "orig": "294", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 70, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 232.292, "r_y0": 289.809, "r_x1": 240.043, "r_y1": 289.809, "r_x2": 240.043, "r_y2": 285.522, "r_x3": 232.292, "r_y3": 285.522, "coord_origin": "TOPLEFT"}, "text": "651", "orig": "651", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 71, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 255.765, "r_y0": 289.809, "r_x1": 265.752, "r_y1": 289.809, "r_x2": 265.752, "r_y2": 285.522, "r_x3": 255.765, "r_y3": 285.522, "coord_origin": "TOPLEFT"}, "text": "1122", "orig": "1122", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 72, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 281.477, "r_y0": 289.809, "r_x1": 289.229, "r_y1": 289.809, "r_x2": 289.229, "r_y2": 285.522, "r_x3": 281.477, "r_y3": 285.522, "coord_origin": "TOPLEFT"}, "text": "955", "orig": "955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": [{"id": 55, "label": "text", "bbox": {"l": 209.933, "t": 221.35799999999995, "r": 223.873, "b": 226.00400000000002, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 209.933, "r_y0": 226.00400000000002, "r_x1": 223.873, "r_y1": 226.00400000000002, "r_x2": 223.873, "r_y2": 221.35799999999995, "r_x3": 209.933, "r_y3": 221.35799999999995, "coord_origin": "TOPLEFT"}, "text": "\u8ad6\u6587\u30d5\u30a1\u30a4\u30eb", "orig": "\u8ad6\u6587\u30d5\u30a1\u30a4\u30eb", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 56, "label": "text", "bbox": {"l": 263.765, "t": 221.35799999999995, "r": 273.058, "b": 226.00400000000002, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 263.765, "r_y0": 226.00400000000002, "r_x1": 273.058, "r_y1": 226.00400000000002, "r_x2": 273.058, "r_y2": 221.35799999999995, "r_x3": 263.765, "r_y3": 221.35799999999995, "coord_origin": "TOPLEFT"}, "text": "\u53c2\u8003\u6587\u732e", "orig": "\u53c2\u8003\u6587\u732e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 57, "label": "text", "bbox": {"l": 110.25, "t": 228.84400000000005, "r": 114.896, "b": 233.49, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 110.25, "r_y0": 233.49, "r_x1": 114.896, "r_y1": 233.49, "r_x2": 114.896, "r_y2": 228.84400000000005, "r_x3": 110.25, "r_y3": 228.84400000000005, "coord_origin": "TOPLEFT"}, "text": "\u51fa\u5178", "orig": "\u51fa\u5178", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 58, "label": "text", "bbox": {"l": 175.366, "t": 228.84400000000005, "r": 186.983, "b": 233.49, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 175.366, "r_y0": 233.49, "r_x1": 186.983, "r_y1": 233.49, "r_x2": 186.983, "r_y2": 228.84400000000005, "r_x3": 175.366, "r_y3": 228.84400000000005, "coord_origin": "TOPLEFT"}, "text": "\u30d5\u30a1\u30a4\u30eb\u6570", "orig": "\u30d5\u30a1\u30a4\u30eb\u6570", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 59, "label": "text", "bbox": {"l": 195.314, "t": 228.84400000000005, "r": 199.961, "b": 233.49, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 195.314, "r_y0": 233.49, "r_x1": 199.961, "r_y1": 233.49, "r_x2": 199.961, "r_y2": 228.84400000000005, "r_x3": 195.314, "r_y3": 228.84400000000005, "coord_origin": "TOPLEFT"}, "text": "\u82f1\u8a9e", "orig": "\u82f1\u8a9e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 60, "label": "text", "bbox": {"l": 229.198, "t": 228.84400000000005, "r": 236.168, "b": 233.49, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 229.198, "r_y0": 233.49, "r_x1": 236.168, "r_y1": 233.49, "r_x2": 236.168, "r_y2": 228.84400000000005, "r_x3": 229.198, "r_y3": 228.84400000000005, "coord_origin": "TOPLEFT"}, "text": "\u65e5\u672c\u8a9e", "orig": "\u65e5\u672c\u8a9e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 61, "label": "text", "bbox": {"l": 256.114, "t": 228.84400000000005, "r": 260.761, "b": 233.49, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 256.114, "r_y0": 233.49, "r_x1": 260.761, "r_y1": 233.49, "r_x2": 260.761, "r_y2": 228.84400000000005, "r_x3": 256.114, "r_y3": 228.84400000000005, "coord_origin": "TOPLEFT"}, "text": "\u82f1\u8a9e", "orig": "\u82f1\u8a9e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 62, "label": "text", "bbox": {"l": 278.384, "t": 228.84400000000005, "r": 285.354, "b": 233.49, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 278.384, "r_y0": 233.49, "r_x1": 285.354, "r_y1": 233.49, "r_x2": 285.354, "r_y2": 228.84400000000005, "r_x3": 278.384, "r_y3": 228.84400000000005, "coord_origin": "TOPLEFT"}, "text": "\u65e5\u672c\u8a9e", "orig": "\u65e5\u672c\u8a9e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 63, "label": "text", "bbox": {"l": 55.531, "t": 236.48199999999997, "r": 162.713, "b": 240.76800000000003, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 55.531, "r_y0": 240.76800000000003, "r_x1": 162.713, "r_y1": 240.76800000000003, "r_x2": 162.713, "r_y2": 236.48199999999997, "r_x3": 55.531, "r_y3": 236.48199999999997, "coord_origin": "TOPLEFT"}, "text": "Association for Computational Linguistics(ACL2003)", "orig": "Association for Computational Linguistics(ACL2003)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 64, "label": "text", "bbox": {"l": 184.397, "t": 236.48199999999997, "r": 189.565, "b": 240.76800000000003, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 184.397, "r_y0": 240.76800000000003, "r_x1": 189.565, "r_y1": 240.76800000000003, "r_x2": 189.565, "r_y2": 236.48199999999997, "r_x3": 184.397, "r_y3": 236.48199999999997, "coord_origin": "TOPLEFT"}, "text": "65", "orig": "65", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 65, "label": "text", "bbox": {"l": 208.99, "t": 236.48199999999997, "r": 214.158, "b": 240.76800000000003, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 208.99, "r_y0": 240.76800000000003, "r_x1": 214.158, "r_y1": 240.76800000000003, "r_x2": 214.158, "r_y2": 236.48199999999997, "r_x3": 208.99, "r_y3": 236.48199999999997, "coord_origin": "TOPLEFT"}, "text": "65", "orig": "65", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 66, "label": "text", "bbox": {"l": 234.875, "t": 236.48199999999997, "r": 237.458, "b": 240.76800000000003, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 234.875, "r_y0": 240.76800000000003, "r_x1": 237.458, "r_y1": 240.76800000000003, "r_x2": 237.458, "r_y2": 236.48199999999997, "r_x3": 234.875, "r_y3": 236.48199999999997, "coord_origin": "TOPLEFT"}, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 67, "label": "text", "bbox": {"l": 256.884, "t": 236.48199999999997, "r": 264.636, "b": 240.76800000000003, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 256.884, "r_y0": 240.76800000000003, "r_x1": 264.636, "r_y1": 240.76800000000003, "r_x2": 264.636, "r_y2": 236.48199999999997, "r_x3": 256.884, "r_y3": 236.48199999999997, "coord_origin": "TOPLEFT"}, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 68, "label": "text", "bbox": {"l": 284.061, "t": 236.48199999999997, "r": 286.644, "b": 240.76800000000003, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 284.061, "r_y0": 240.76800000000003, "r_x1": 286.644, "r_y1": 240.76800000000003, "r_x2": 286.644, "r_y2": 236.48199999999997, "r_x3": 284.061, "r_y3": 236.48199999999997, "coord_origin": "TOPLEFT"}, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 69, "label": "text", "bbox": {"l": 55.531, "t": 242.67600000000004, "r": 139.722, "b": 246.962, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 55.531, "r_y0": 246.962, "r_x1": 139.722, "r_y1": 246.962, "r_x2": 139.722, "r_y2": 242.67600000000004, "r_x3": 55.531, "r_y3": 242.67600000000004, "coord_origin": "TOPLEFT"}, "text": "Computational Linguistics(COLING2002)", "orig": "Computational Linguistics(COLING2002)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 70, "label": "text", "bbox": {"l": 183.105, "t": 242.67600000000004, "r": 190.857, "b": 246.962, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 19, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.105, "r_y0": 246.962, "r_x1": 190.857, "r_y1": 246.962, "r_x2": 190.857, "r_y2": 242.67600000000004, "r_x3": 183.105, "r_y3": 242.67600000000004, "coord_origin": "TOPLEFT"}, "text": "140", "orig": "140", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 71, "label": "text", "bbox": {"l": 207.698, "t": 242.67600000000004, "r": 215.45, "b": 246.962, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 20, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 207.698, "r_y0": 246.962, "r_x1": 215.45, "r_y1": 246.962, "r_x2": 215.45, "r_y2": 242.67600000000004, "r_x3": 207.698, "r_y3": 242.67600000000004, "coord_origin": "TOPLEFT"}, "text": "140", "orig": "140", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 72, "label": "text", "bbox": {"l": 234.875, "t": 242.67600000000004, "r": 237.458, "b": 246.962, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 21, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 234.875, "r_y0": 246.962, "r_x1": 237.458, "r_y1": 246.962, "r_x2": 237.458, "r_y2": 242.67600000000004, "r_x3": 234.875, "r_y3": 242.67600000000004, "coord_origin": "TOPLEFT"}, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 73, "label": "text", "bbox": {"l": 256.884, "t": 242.67600000000004, "r": 264.636, "b": 246.962, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 22, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 256.884, "r_y0": 246.962, "r_x1": 264.636, "r_y1": 246.962, "r_x2": 264.636, "r_y2": 242.67600000000004, "r_x3": 256.884, "r_y3": 242.67600000000004, "coord_origin": "TOPLEFT"}, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 74, "label": "text", "bbox": {"l": 284.061, "t": 242.67600000000004, "r": 286.644, "b": 246.962, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 23, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 284.061, "r_y0": 246.962, "r_x1": 286.644, "r_y1": 246.962, "r_x2": 286.644, "r_y2": 242.67600000000004, "r_x3": 284.061, "r_y3": 242.67600000000004, "coord_origin": "TOPLEFT"}, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 75, "label": "text", "bbox": {"l": 55.531, "t": 248.976, "r": 74.118, "b": 253.62199999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 24, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 55.531, "r_y0": 253.62199999999996, "r_x1": 74.118, "r_y1": 253.62199999999996, "r_x2": 74.118, "r_y2": 248.976, "r_x3": 55.531, "r_y3": 248.976, "coord_origin": "TOPLEFT"}, "text": "\u96fb\u6c17\u60c5\u5831\u901a\u4fe1\u5b66\u4f1a", "orig": "\u96fb\u6c17\u60c5\u5831\u901a\u4fe1\u5b66\u4f1a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 76, "label": "text", "bbox": {"l": 92.698, "t": 249.64499999999998, "r": 103.034, "b": 253.93100000000004, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 25, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 92.698, "r_y0": 253.93100000000004, "r_x1": 103.034, "r_y1": 253.93100000000004, "r_x2": 103.034, "r_y2": 249.64499999999998, "r_x3": 92.698, "r_y3": 249.64499999999998, "coord_origin": "TOPLEFT"}, "text": "2003", "orig": "2003", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 77, "label": "text", "bbox": {"l": 103.034, "t": 248.976, "r": 114.651, "b": 253.62199999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 26, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 103.034, "r_y0": 253.62199999999996, "r_x1": 114.651, "r_y1": 253.62199999999996, "r_x2": 114.651, "r_y2": 248.976, "r_x3": 103.034, "r_y3": 248.976, "coord_origin": "TOPLEFT"}, "text": "\u5e74\u7dcf\u5408\u5927\u4f1a", "orig": "\u5e74\u7dcf\u5408\u5927\u4f1a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 78, "label": "text", "bbox": {"l": 183.105, "t": 248.87099999999998, "r": 190.857, "b": 253.15700000000004, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 27, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.105, "r_y0": 253.15700000000004, "r_x1": 190.857, "r_y1": 253.15700000000004, "r_x2": 190.857, "r_y2": 248.87099999999998, "r_x3": 183.105, "r_y3": 248.87099999999998, "coord_origin": "TOPLEFT"}, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 79, "label": "text", "bbox": {"l": 210.282, "t": 248.87099999999998, "r": 212.865, "b": 253.15700000000004, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 28, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 210.282, "r_y0": 253.15700000000004, "r_x1": 212.865, "r_y1": 253.15700000000004, "r_x2": 212.865, "r_y2": 248.87099999999998, "r_x3": 210.282, "r_y3": 248.87099999999998, "coord_origin": "TOPLEFT"}, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 80, "label": "text", "bbox": {"l": 232.292, "t": 248.87099999999998, "r": 240.043, "b": 253.15700000000004, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 29, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 232.292, "r_y0": 253.15700000000004, "r_x1": 240.043, "r_y1": 253.15700000000004, "r_x2": 240.043, "r_y2": 248.87099999999998, "r_x3": 232.292, "r_y3": 248.87099999999998, "coord_origin": "TOPLEFT"}, "text": "142", "orig": "142", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 81, "label": "text", "bbox": {"l": 256.884, "t": 248.87099999999998, "r": 264.636, "b": 253.15700000000004, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 30, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 256.884, "r_y0": 253.15700000000004, "r_x1": 264.636, "r_y1": 253.15700000000004, "r_x2": 264.636, "r_y2": 248.87099999999998, "r_x3": 256.884, "r_y3": 248.87099999999998, "coord_origin": "TOPLEFT"}, "text": "223", "orig": "223", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 82, "label": "text", "bbox": {"l": 281.477, "t": 248.87099999999998, "r": 289.229, "b": 253.15700000000004, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 281.477, "r_y0": 253.15700000000004, "r_x1": 289.229, "r_y1": 253.15700000000004, "r_x2": 289.229, "r_y2": 248.87099999999998, "r_x3": 281.477, "r_y3": 248.87099999999998, "coord_origin": "TOPLEFT"}, "text": "147", "orig": "147", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 83, "label": "text", "bbox": {"l": 55.531, "t": 256.461, "r": 71.794, "b": 261.10699999999997, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 55.531, "r_y0": 261.10699999999997, "r_x1": 71.794, "r_y1": 261.10699999999997, "r_x2": 71.794, "r_y2": 256.461, "r_x3": 55.531, "r_y3": 256.461, "coord_origin": "TOPLEFT"}, "text": "\u60c5\u5831\u51e6\u7406\u5b66\u4f1a\u7b2c", "orig": "\u60c5\u5831\u51e6\u7406\u5b66\u4f1a\u7b2c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 84, "label": "text", "bbox": {"l": 88.053, "t": 257.13, "r": 93.22, "b": 261.41600000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 88.053, "r_y0": 261.41600000000005, "r_x1": 93.22, "r_y1": 261.41600000000005, "r_x2": 93.22, "r_y2": 257.13, "r_x3": 88.053, "r_y3": 257.13, "coord_origin": "TOPLEFT"}, "text": "65", "orig": "65", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 85, "label": "text", "bbox": {"l": 93.22, "t": 256.461, "r": 104.837, "b": 261.10699999999997, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 93.22, "r_y0": 261.10699999999997, "r_x1": 104.837, "r_y1": 261.10699999999997, "r_x2": 104.837, "r_y2": 256.461, "r_x3": 93.22, "r_y3": 256.461, "coord_origin": "TOPLEFT"}, "text": "\u56de\u5168\u56fd\u5927\u4f1a", "orig": "\u56de\u5168\u56fd\u5927\u4f1a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 86, "label": "text", "bbox": {"l": 116.451, "t": 257.13, "r": 129.882, "b": 261.41600000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 116.451, "r_y0": 261.41600000000005, "r_x1": 129.882, "r_y1": 261.41600000000005, "r_x2": 129.882, "r_y2": 257.13, "r_x3": 116.451, "r_y3": 257.13, "coord_origin": "TOPLEFT"}, "text": "(2003)", "orig": "(2003)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 87, "label": "text", "bbox": {"l": 183.105, "t": 256.356, "r": 190.857, "b": 260.64200000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.105, "r_y0": 260.64200000000005, "r_x1": 190.857, "r_y1": 260.64200000000005, "r_x2": 190.857, "r_y2": 256.356, "r_x3": 183.105, "r_y3": 256.356, "coord_origin": "TOPLEFT"}, "text": "177", "orig": "177", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 88, "label": "text", "bbox": {"l": 210.282, "t": 256.356, "r": 212.865, "b": 260.64200000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 210.282, "r_y0": 260.64200000000005, "r_x1": 212.865, "r_y1": 260.64200000000005, "r_x2": 212.865, "r_y2": 256.356, "r_x3": 210.282, "r_y3": 256.356, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 89, "label": "text", "bbox": {"l": 232.292, "t": 256.356, "r": 240.043, "b": 260.64200000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 232.292, "r_y0": 260.64200000000005, "r_x1": 240.043, "r_y1": 260.64200000000005, "r_x2": 240.043, "r_y2": 256.356, "r_x3": 232.292, "r_y3": 256.356, "coord_origin": "TOPLEFT"}, "text": "176", "orig": "176", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 90, "label": "text", "bbox": {"l": 256.884, "t": 256.356, "r": 264.636, "b": 260.64200000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 256.884, "r_y0": 260.64200000000005, "r_x1": 264.636, "r_y1": 260.64200000000005, "r_x2": 264.636, "r_y2": 256.356, "r_x3": 256.884, "r_y3": 256.356, "coord_origin": "TOPLEFT"}, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 91, "label": "text", "bbox": {"l": 281.477, "t": 256.356, "r": 289.229, "b": 260.64200000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 281.477, "r_y0": 260.64200000000005, "r_x1": 289.229, "r_y1": 260.64200000000005, "r_x2": 289.229, "r_y2": 256.356, "r_x3": 281.477, "r_y3": 256.356, "coord_origin": "TOPLEFT"}, "text": "236", "orig": "236", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 92, "label": "text", "bbox": {"l": 55.531, "t": 263.688, "r": 57.854, "b": 268.33399999999995, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 55.531, "r_y0": 268.33399999999995, "r_x1": 57.854, "r_y1": 268.33399999999995, "r_x2": 57.854, "r_y2": 263.688, "r_x3": 55.531, "r_y3": 263.688, "coord_origin": "TOPLEFT"}, "text": "\u7b2c", "orig": "\u7b2c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 93, "label": "text", "bbox": {"l": 60.177, "t": 264.35699999999997, "r": 65.344, "b": 268.644, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 60.177, "r_y0": 268.644, "r_x1": 65.344, "r_y1": 268.644, "r_x2": 65.344, "r_y2": 264.35699999999997, "r_x3": 60.177, "r_y3": 264.35699999999997, "coord_origin": "TOPLEFT"}, "text": "17", "orig": "17", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 94, "label": "text", "bbox": {"l": 65.344, "t": 263.688, "r": 90.902, "b": 268.33399999999995, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 65.344, "r_y0": 268.33399999999995, "r_x1": 90.902, "r_y1": 268.33399999999995, "r_x2": 90.902, "r_y2": 263.688, "r_x3": 65.344, "r_y3": 263.688, "coord_origin": "TOPLEFT"}, "text": "\u56de\u4eba\u5de5\u77e5\u80fd\u5b66\u4f1a\u5168\u56fd\u5927\u4f1a", "orig": "\u56de\u4eba\u5de5\u77e5\u80fd\u5b66\u4f1a\u5168\u56fd\u5927\u4f1a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 95, "label": "text", "bbox": {"l": 116.451, "t": 264.35699999999997, "r": 129.882, "b": 268.644, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 116.451, "r_y0": 268.644, "r_x1": 129.882, "r_y1": 268.644, "r_x2": 129.882, "r_y2": 264.35699999999997, "r_x3": 116.451, "r_y3": 264.35699999999997, "coord_origin": "TOPLEFT"}, "text": "(2003)", "orig": "(2003)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 96, "label": "text", "bbox": {"l": 183.105, "t": 263.58299999999997, "r": 190.857, "b": 267.869, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.105, "r_y0": 267.869, "r_x1": 190.857, "r_y1": 267.869, "r_x2": 190.857, "r_y2": 263.58299999999997, "r_x3": 183.105, "r_y3": 263.58299999999997, "coord_origin": "TOPLEFT"}, "text": "208", "orig": "208", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 97, "label": "text", "bbox": {"l": 210.282, "t": 263.58299999999997, "r": 212.865, "b": 267.869, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 210.282, "r_y0": 267.869, "r_x1": 212.865, "r_y1": 267.869, "r_x2": 212.865, "r_y2": 263.58299999999997, "r_x3": 210.282, "r_y3": 263.58299999999997, "coord_origin": "TOPLEFT"}, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 98, "label": "text", "bbox": {"l": 232.292, "t": 263.58299999999997, "r": 240.043, "b": 267.869, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 232.292, "r_y0": 267.869, "r_x1": 240.043, "r_y1": 267.869, "r_x2": 240.043, "r_y2": 263.58299999999997, "r_x3": 232.292, "r_y3": 263.58299999999997, "coord_origin": "TOPLEFT"}, "text": "203", "orig": "203", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 99, "label": "text", "bbox": {"l": 256.884, "t": 263.58299999999997, "r": 264.636, "b": 267.869, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 48, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 256.884, "r_y0": 267.869, "r_x1": 264.636, "r_y1": 267.869, "r_x2": 264.636, "r_y2": 263.58299999999997, "r_x3": 256.884, "r_y3": 263.58299999999997, "coord_origin": "TOPLEFT"}, "text": "152", "orig": "152", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 100, "label": "text", "bbox": {"l": 281.477, "t": 263.58299999999997, "r": 289.229, "b": 267.869, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 49, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 281.477, "r_y0": 267.869, "r_x1": 289.229, "r_y1": 267.869, "r_x2": 289.229, "r_y2": 263.58299999999997, "r_x3": 281.477, "r_y3": 263.58299999999997, "coord_origin": "TOPLEFT"}, "text": "244", "orig": "244", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 101, "label": "text", "bbox": {"l": 55.531, "t": 270.91600000000005, "r": 78.765, "b": 275.562, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 50, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 55.531, "r_y0": 275.562, "r_x1": 78.765, "r_y1": 275.562, "r_x2": 78.765, "r_y2": 270.91600000000005, "r_x3": 55.531, "r_y3": 270.91600000000005, "coord_origin": "TOPLEFT"}, "text": "\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u7814\u7a76\u4f1a\u7b2c", "orig": "\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u7814\u7a76\u4f1a\u7b2c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 102, "label": "text", "bbox": {"l": 101.99, "t": 271.58500000000004, "r": 109.742, "b": 275.871, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 51, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 101.99, "r_y0": 275.871, "r_x1": 109.742, "r_y1": 275.871, "r_x2": 109.742, "r_y2": 271.58500000000004, "r_x3": 101.99, "r_y3": 271.58500000000004, "coord_origin": "TOPLEFT"}, "text": "146", "orig": "146", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 103, "label": "text", "bbox": {"l": 109.742, "t": 270.91600000000005, "r": 112.065, "b": 275.562, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 52, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 109.742, "r_y0": 275.562, "r_x1": 112.065, "r_y1": 275.562, "r_x2": 112.065, "r_y2": 270.91600000000005, "r_x3": 109.742, "r_y3": 270.91600000000005, "coord_origin": "TOPLEFT"}, "text": "\u301c", "orig": "\u301c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 104, "label": "text", "bbox": {"l": 114.388, "t": 271.58500000000004, "r": 122.139, "b": 275.871, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 53, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 114.388, "r_y0": 275.871, "r_x1": 122.139, "r_y1": 275.871, "r_x2": 122.139, "r_y2": 271.58500000000004, "r_x3": 114.388, "r_y3": 271.58500000000004, "coord_origin": "TOPLEFT"}, "text": "155", "orig": "155", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 105, "label": "text", "bbox": {"l": 122.14, "t": 270.91600000000005, "r": 124.463, "b": 275.562, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 54, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 122.14, "r_y0": 275.562, "r_x1": 124.463, "r_y1": 275.562, "r_x2": 124.463, "r_y2": 270.91600000000005, "r_x3": 122.14, "r_y3": 270.91600000000005, "coord_origin": "TOPLEFT"}, "text": "\u56de", "orig": "\u56de", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 106, "label": "text", "bbox": {"l": 184.397, "t": 270.80999999999995, "r": 189.565, "b": 275.096, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 55, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 184.397, "r_y0": 275.096, "r_x1": 189.565, "r_y1": 275.096, "r_x2": 189.565, "r_y2": 270.80999999999995, "r_x3": 184.397, "r_y3": 270.80999999999995, "coord_origin": "TOPLEFT"}, "text": "98", "orig": "98", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 107, "label": "text", "bbox": {"l": 210.282, "t": 270.80999999999995, "r": 212.865, "b": 275.096, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 56, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 210.282, "r_y0": 275.096, "r_x1": 212.865, "r_y1": 275.096, "r_x2": 212.865, "r_y2": 270.80999999999995, "r_x3": 210.282, "r_y3": 270.80999999999995, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 108, "label": "text", "bbox": {"l": 233.583, "t": 270.80999999999995, "r": 238.751, "b": 275.096, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 57, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 233.583, "r_y0": 275.096, "r_x1": 238.751, "r_y1": 275.096, "r_x2": 238.751, "r_y2": 270.80999999999995, "r_x3": 233.583, "r_y3": 270.80999999999995, "coord_origin": "TOPLEFT"}, "text": "96", "orig": "96", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 109, "label": "text", "bbox": {"l": 256.884, "t": 270.80999999999995, "r": 264.636, "b": 275.096, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 58, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 256.884, "r_y0": 275.096, "r_x1": 264.636, "r_y1": 275.096, "r_x2": 264.636, "r_y2": 270.80999999999995, "r_x3": 256.884, "r_y3": 270.80999999999995, "coord_origin": "TOPLEFT"}, "text": "150", "orig": "150", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 110, "label": "text", "bbox": {"l": 281.477, "t": 270.80999999999995, "r": 289.229, "b": 275.096, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 59, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 281.477, "r_y0": 275.096, "r_x1": 289.229, "r_y1": 275.096, "r_x2": 289.229, "r_y2": 270.80999999999995, "r_x3": 281.477, "r_y3": 270.80999999999995, "coord_origin": "TOPLEFT"}, "text": "232", "orig": "232", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 111, "label": "text", "bbox": {"l": 55.531, "t": 279.07000000000005, "r": 68.686, "b": 283.356, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 60, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 55.531, "r_y0": 283.356, "r_x1": 68.686, "r_y1": 283.356, "r_x2": 68.686, "r_y2": 279.07000000000005, "r_x3": 55.531, "r_y3": 279.07000000000005, "coord_origin": "TOPLEFT"}, "text": "WWW", "orig": "WWW", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 112, "label": "text", "bbox": {"l": 68.686, "t": 278.40099999999995, "r": 87.273, "b": 283.047, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 61, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 68.686, "r_y0": 283.047, "r_x1": 87.273, "r_y1": 283.047, "r_x2": 87.273, "r_y2": 278.40099999999995, "r_x3": 68.686, "r_y3": 278.40099999999995, "coord_origin": "TOPLEFT"}, "text": "\u304b\u3089\u53ce\u96c6\u3057\u305f\u8ad6\u6587", "orig": "\u304b\u3089\u53ce\u96c6\u3057\u305f\u8ad6\u6587", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 113, "label": "text", "bbox": {"l": 183.105, "t": 278.03700000000003, "r": 190.857, "b": 282.323, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 62, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.105, "r_y0": 282.323, "r_x1": 190.857, "r_y1": 282.323, "r_x2": 190.857, "r_y2": 278.03700000000003, "r_x3": 183.105, "r_y3": 278.03700000000003, "coord_origin": "TOPLEFT"}, "text": "107", "orig": "107", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 114, "label": "text", "bbox": {"l": 208.99, "t": 278.03700000000003, "r": 214.158, "b": 282.323, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 63, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 208.99, "r_y0": 282.323, "r_x1": 214.158, "r_y1": 282.323, "r_x2": 214.158, "r_y2": 278.03700000000003, "r_x3": 208.99, "r_y3": 278.03700000000003, "coord_origin": "TOPLEFT"}, "text": "73", "orig": "73", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 115, "label": "text", "bbox": {"l": 233.583, "t": 278.03700000000003, "r": 238.751, "b": 282.323, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 64, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 233.583, "r_y0": 282.323, "r_x1": 238.751, "r_y1": 282.323, "r_x2": 238.751, "r_y2": 278.03700000000003, "r_x3": 233.583, "r_y3": 278.03700000000003, "coord_origin": "TOPLEFT"}, "text": "34", "orig": "34", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 116, "label": "text", "bbox": {"l": 256.884, "t": 278.03700000000003, "r": 264.636, "b": 282.323, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 65, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 256.884, "r_y0": 282.323, "r_x1": 264.636, "r_y1": 282.323, "r_x2": 264.636, "r_y2": 278.03700000000003, "r_x3": 256.884, "r_y3": 278.03700000000003, "coord_origin": "TOPLEFT"}, "text": "147", "orig": "147", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 117, "label": "text", "bbox": {"l": 282.769, "t": 278.03700000000003, "r": 287.937, "b": 282.323, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 66, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 282.769, "r_y0": 282.323, "r_x1": 287.937, "r_y1": 282.323, "r_x2": 287.937, "r_y2": 278.03700000000003, "r_x3": 282.769, "r_y3": 278.03700000000003, "coord_origin": "TOPLEFT"}, "text": "96", "orig": "96", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 118, "label": "text", "bbox": {"l": 169.615, "t": 285.628, "r": 171.938, "b": 290.274, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 67, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 169.615, "r_y0": 290.274, "r_x1": 171.938, "r_y1": 290.274, "r_x2": 171.938, "r_y2": 285.628, "r_x3": 169.615, "r_y3": 285.628, "coord_origin": "TOPLEFT"}, "text": "\u8a08", "orig": "\u8a08", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 119, "label": "text", "bbox": {"l": 183.105, "t": 285.522, "r": 190.857, "b": 289.809, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 68, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 183.105, "r_y0": 289.809, "r_x1": 190.857, "r_y1": 289.809, "r_x2": 190.857, "r_y2": 285.522, "r_x3": 183.105, "r_y3": 285.522, "coord_origin": "TOPLEFT"}, "text": "945", "orig": "945", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 120, "label": "text", "bbox": {"l": 207.698, "t": 285.522, "r": 215.45, "b": 289.809, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 69, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 207.698, "r_y0": 289.809, "r_x1": 215.45, "r_y1": 289.809, "r_x2": 215.45, "r_y2": 285.522, "r_x3": 207.698, "r_y3": 285.522, "coord_origin": "TOPLEFT"}, "text": "294", "orig": "294", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 121, "label": "text", "bbox": {"l": 232.292, "t": 285.522, "r": 240.043, "b": 289.809, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 70, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 232.292, "r_y0": 289.809, "r_x1": 240.043, "r_y1": 289.809, "r_x2": 240.043, "r_y2": 285.522, "r_x3": 232.292, "r_y3": 285.522, "coord_origin": "TOPLEFT"}, "text": "651", "orig": "651", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 122, "label": "text", "bbox": {"l": 255.765, "t": 285.522, "r": 265.752, "b": 289.809, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 71, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 255.765, "r_y0": 289.809, "r_x1": 265.752, "r_y1": 289.809, "r_x2": 265.752, "r_y2": 285.522, "r_x3": 255.765, "r_y3": 285.522, "coord_origin": "TOPLEFT"}, "text": "1122", "orig": "1122", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 123, "label": "text", "bbox": {"l": 281.477, "t": 285.522, "r": 289.229, "b": 289.809, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 72, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 281.477, "r_y0": 289.809, "r_x1": 289.229, "r_y1": 289.809, "r_x2": 289.229, "r_y2": 285.522, "r_x3": 281.477, "r_y3": 285.522, "coord_origin": "TOPLEFT"}, "text": "955", "orig": "955", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}]}, "text": null, "otsl_seq": ["ched", "ched", "ched", "lcel", "ched", "lcel", "nl", "ched", "ched", "ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 10, "num_cols": 6, "table_cells": [{"bbox": {"l": 209.933, "t": 221.35799999999995, "r": 223.873, "b": 226.00400000000002, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 2, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 2, "end_col_offset_idx": 4, "text": "\u8ad6\u6587\u30d5\u30a1\u30a4\u30eb", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 263.765, "t": 221.35799999999995, "r": 273.058, "b": 226.00400000000002, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 2, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 4, "end_col_offset_idx": 6, "text": "\u53c2\u8003\u6587\u732e", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 110.25, "t": 228.84400000000005, "r": 114.896, "b": 233.49, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "\u51fa\u5178", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 175.366, "t": 228.84400000000005, "r": 199.961, "b": 233.49, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "\u30d5\u30a1\u30a4\u30eb\u6570 \u82f1\u8a9e", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 229.198, "t": 228.84400000000005, "r": 236.168, "b": 233.49, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "\u65e5\u672c\u8a9e", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 256.114, "t": 228.84400000000005, "r": 260.761, "b": 233.49, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "\u82f1\u8a9e", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 278.384, "t": 228.84400000000005, "r": 285.354, "b": 233.49, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "\u65e5\u672c\u8a9e", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 55.531, "t": 236.48199999999997, "r": 162.713, "b": 240.76800000000003, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Association for Computational Linguistics(ACL2003)", "column_header": false, "row_header": true, "row_section": false}, {"bbox": {"l": 184.397, "t": 236.48199999999997, "r": 189.565, "b": 240.76800000000003, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "65", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 208.99, "t": 236.48199999999997, "r": 214.158, "b": 240.76800000000003, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "65", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 234.875, "t": 236.48199999999997, "r": 237.458, "b": 240.76800000000003, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "0", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 256.884, "t": 236.48199999999997, "r": 264.636, "b": 240.76800000000003, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "150", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 284.061, "t": 236.48199999999997, "r": 286.644, "b": 240.76800000000003, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "0", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 55.531, "t": 242.67600000000004, "r": 139.722, "b": 246.962, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Computational Linguistics(COLING2002)", "column_header": false, "row_header": true, "row_section": false}, {"bbox": {"l": 183.105, "t": 242.67600000000004, "r": 190.857, "b": 246.962, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "140", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 207.698, "t": 242.67600000000004, "r": 215.45, "b": 246.962, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "140", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 234.875, "t": 242.67600000000004, "r": 237.458, "b": 246.962, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "0", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 256.884, "t": 242.67600000000004, "r": 264.636, "b": 246.962, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "150", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 284.061, "t": 242.67600000000004, "r": 286.644, "b": 246.962, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "0", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 55.531, "t": 248.976, "r": 114.651, "b": 253.93100000000004, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "\u96fb\u6c17\u60c5\u5831\u901a\u4fe1\u5b66\u4f1a 2003 \u5e74\u7dcf\u5408\u5927\u4f1a", "column_header": false, "row_header": true, "row_section": false}, {"bbox": {"l": 183.105, "t": 248.87099999999998, "r": 190.857, "b": 253.15700000000004, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "150", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 210.282, "t": 248.87099999999998, "r": 212.865, "b": 253.15700000000004, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "8", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 232.292, "t": 248.87099999999998, "r": 240.043, "b": 253.15700000000004, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "142", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 256.884, "t": 248.87099999999998, "r": 264.636, "b": 253.15700000000004, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "223", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 281.477, "t": 248.87099999999998, "r": 289.229, "b": 253.15700000000004, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "147", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 55.531, "t": 256.461, "r": 129.882, "b": 261.41600000000005, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "\u60c5\u5831\u51e6\u7406\u5b66\u4f1a\u7b2c 65 \u56de\u5168\u56fd\u5927\u4f1a (2003)", "column_header": false, "row_header": true, "row_section": false}, {"bbox": {"l": 183.105, "t": 256.356, "r": 190.857, "b": 260.64200000000005, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "177", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 210.282, "t": 256.356, "r": 212.865, "b": 260.64200000000005, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "1", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 232.292, "t": 256.356, "r": 240.043, "b": 260.64200000000005, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "176", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 256.884, "t": 256.356, "r": 264.636, "b": 260.64200000000005, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "150", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 281.477, "t": 256.356, "r": 289.229, "b": 260.64200000000005, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "236", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 55.531, "t": 263.688, "r": 129.882, "b": 268.644, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "\u7b2c 17 \u56de\u4eba\u5de5\u77e5\u80fd\u5b66\u4f1a\u5168\u56fd\u5927\u4f1a (2003)", "column_header": false, "row_header": true, "row_section": false}, {"bbox": {"l": 183.105, "t": 263.58299999999997, "r": 190.857, "b": 267.869, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "208", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 210.282, "t": 263.58299999999997, "r": 212.865, "b": 267.869, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "5", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 232.292, "t": 263.58299999999997, "r": 240.043, "b": 267.869, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "203", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 256.884, "t": 263.58299999999997, "r": 264.636, "b": 267.869, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "152", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 281.477, "t": 263.58299999999997, "r": 289.229, "b": 267.869, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "244", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 55.531, "t": 270.91600000000005, "r": 124.463, "b": 275.871, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 7, "end_row_offset_idx": 8, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "\u81ea\u7136\u8a00\u8a9e\u51e6\u7406\u7814\u7a76\u4f1a\u7b2c 146 \u301c 155 \u56de", "column_header": false, "row_header": true, "row_section": false}, {"bbox": {"l": 184.397, "t": 270.80999999999995, "r": 189.565, "b": 275.096, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 7, "end_row_offset_idx": 8, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "98", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 210.282, "t": 270.80999999999995, "r": 212.865, "b": 275.096, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 7, "end_row_offset_idx": 8, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "2", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 233.583, "t": 270.80999999999995, "r": 238.751, "b": 275.096, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 7, "end_row_offset_idx": 8, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "96", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 256.884, "t": 270.80999999999995, "r": 264.636, "b": 275.096, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 7, "end_row_offset_idx": 8, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "150", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 281.477, "t": 270.80999999999995, "r": 289.229, "b": 275.096, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 7, "end_row_offset_idx": 8, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "232", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 55.531, "t": 278.40099999999995, "r": 87.273, "b": 283.356, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 8, "end_row_offset_idx": 9, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "WWW \u304b\u3089\u53ce\u96c6\u3057\u305f\u8ad6\u6587", "column_header": false, "row_header": true, "row_section": false}, {"bbox": {"l": 183.105, "t": 278.03700000000003, "r": 190.857, "b": 282.323, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 8, "end_row_offset_idx": 9, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "107", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 208.99, "t": 278.03700000000003, "r": 214.158, "b": 282.323, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 8, "end_row_offset_idx": 9, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "73", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 233.583, "t": 278.03700000000003, "r": 238.751, "b": 282.323, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 8, "end_row_offset_idx": 9, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "34", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 256.884, "t": 278.03700000000003, "r": 264.636, "b": 282.323, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 8, "end_row_offset_idx": 9, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "147", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 282.769, "t": 278.03700000000003, "r": 287.937, "b": 282.323, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 8, "end_row_offset_idx": 9, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "96", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 169.615, "t": 285.628, "r": 171.938, "b": 290.274, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 9, "end_row_offset_idx": 10, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "\u8a08", "column_header": false, "row_header": true, "row_section": false}, {"bbox": {"l": 183.105, "t": 285.522, "r": 190.857, "b": 289.809, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 9, "end_row_offset_idx": 10, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "945", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 207.698, "t": 285.522, "r": 215.45, "b": 289.809, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 9, "end_row_offset_idx": 10, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "294", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 232.292, "t": 285.522, "r": 240.043, "b": 289.809, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 9, "end_row_offset_idx": 10, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "651", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 255.765, "t": 285.522, "r": 265.752, "b": 289.809, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 9, "end_row_offset_idx": 10, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "1122", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 281.477, "t": 285.522, "r": 289.229, "b": 289.809, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 9, "end_row_offset_idx": 10, "start_col_offset_idx": 5, "end_col_offset_idx": 6, "text": "955", "column_header": false, "row_header": false, "row_section": false}]}, {"label": "caption", "id": 16, "page_no": 7, "cluster": {"id": 16, "label": "caption", "bbox": {"l": 380.427, "t": 292.551, "r": 549.422, "b": 298.536, "coord_origin": "TOPLEFT"}, "confidence": 0.7499915957450867, "cells": [{"index": 73, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 380.427, "r_y0": 298.536, "r_x1": 549.422, "r_y1": 298.536, "r_x2": 549.422, "r_y2": 292.551, "r_x3": 380.427, "r_y3": 292.551, "coord_origin": "TOPLEFT"}, "text": "Text is aligned to match original for ease of viewing", "orig": "Text is aligned to match original for ease of viewing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Text is aligned to match original for ease of viewing"}, {"label": "table", "id": 7, "page_no": 7, "cluster": {"id": 7, "label": "table", "bbox": {"l": 304.9219970703125, "t": 218.51486206054688, "r": 550.2321166992188, "b": 287.90069580078125, "coord_origin": "TOPLEFT"}, "confidence": 0.8899767994880676, "cells": [{"index": 74, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 459.049, "r_y0": 226.67100000000005, "r_x1": 542.0, "r_y1": 226.67100000000005, "r_x2": 542.0, "r_y2": 221.68899999999996, "r_x3": 459.049, "r_y3": 221.68899999999996, "coord_origin": "TOPLEFT"}, "text": "Weighted Average Grant Date Fair", "orig": "Weighted Average Grant Date Fair", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 75, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 493.822, "r_y0": 232.88099999999997, "r_x1": 507.226, "r_y1": 232.88099999999997, "r_x2": 507.226, "r_y2": 227.899, "r_x3": 493.822, "r_y3": 227.899, "coord_origin": "TOPLEFT"}, "text": "Value", "orig": "Value", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 76, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 393.244, "r_y0": 241.79399999999998, "r_x1": 407.346, "r_y1": 241.79399999999998, "r_x2": 407.346, "r_y2": 236.812, "r_x3": 393.244, "r_y3": 236.812, "coord_origin": "TOPLEFT"}, "text": "RSUs", "orig": "RSUs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 77, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 392.097, "r_y0": 226.62099999999998, "r_x1": 438.015, "r_y1": 226.62099999999998, "r_x2": 438.015, "r_y2": 221.639, "r_x3": 392.097, "r_y3": 221.639, "coord_origin": "TOPLEFT"}, "text": "Shares (in millions)", "orig": "Shares (in millions)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 78, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 427.183, "r_y0": 241.79399999999998, "r_x1": 440.988, "r_y1": 241.79399999999998, "r_x2": 440.988, "r_y2": 236.812, "r_x3": 427.183, "r_y3": 236.812, "coord_origin": "TOPLEFT"}, "text": "PSUs", "orig": "PSUs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 79, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 468.383, "r_y0": 241.79399999999998, "r_x1": 482.485, "r_y1": 241.79399999999998, "r_x2": 482.485, "r_y2": 236.812, "r_x3": 468.383, "r_y3": 236.812, "coord_origin": "TOPLEFT"}, "text": "RSUs", "orig": "RSUs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 80, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 516.926, "r_y0": 241.79399999999998, "r_x1": 530.73, "r_y1": 241.79399999999998, "r_x2": 530.73, "r_y2": 236.812, "r_x3": 516.926, "r_y3": 236.812, "coord_origin": "TOPLEFT"}, "text": "PSUs", "orig": "PSUs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 81, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 306.115, "r_y0": 249.65700000000004, "r_x1": 364.656, "r_y1": 249.65700000000004, "r_x2": 364.656, "r_y2": 244.67600000000004, "r_x3": 306.115, "r_y3": 244.67600000000004, "coord_origin": "TOPLEFT"}, "text": "Nonvested on January 1", "orig": "Nonvested on January 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 82, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 396.247, "r_y0": 249.96000000000004, "r_x1": 403.755, "r_y1": 249.96000000000004, "r_x2": 403.755, "r_y2": 244.97799999999995, "r_x3": 396.247, "r_y3": 244.97799999999995, "coord_origin": "TOPLEFT"}, "text": "1.1", "orig": "1.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 83, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 429.818, "r_y0": 249.96000000000004, "r_x1": 437.327, "r_y1": 249.96000000000004, "r_x2": 437.327, "r_y2": 244.97799999999995, "r_x3": 429.818, "r_y3": 244.97799999999995, "coord_origin": "TOPLEFT"}, "text": "0.3", "orig": "0.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 84, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 465.529, "r_y0": 249.96000000000004, "r_x1": 483.55, "r_y1": 249.96000000000004, "r_x2": 483.55, "r_y2": 244.97799999999995, "r_x3": 465.529, "r_y3": 244.97799999999995, "coord_origin": "TOPLEFT"}, "text": "90.10 $", "orig": "90.10 $", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 85, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 513.448, "r_y0": 249.96000000000004, "r_x1": 531.47, "r_y1": 249.96000000000004, "r_x2": 531.47, "r_y2": 244.97799999999995, "r_x3": 513.448, "r_y3": 244.97799999999995, "coord_origin": "TOPLEFT"}, "text": "$ 91.19", "orig": "$ 91.19", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 86, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 306.115, "r_y0": 258.731, "r_x1": 325.627, "r_y1": 258.731, "r_x2": 325.627, "r_y2": 253.74900000000002, "r_x3": 306.115, "r_y3": 253.74900000000002, "coord_origin": "TOPLEFT"}, "text": "Granted", "orig": "Granted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 87, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 396.247, "r_y0": 258.731, "r_x1": 403.755, "r_y1": 258.731, "r_x2": 403.755, "r_y2": 253.74900000000002, "r_x3": 396.247, "r_y3": 253.74900000000002, "coord_origin": "TOPLEFT"}, "text": "0.5", "orig": "0.5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 88, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 429.818, "r_y0": 258.731, "r_x1": 437.327, "r_y1": 258.731, "r_x2": 437.327, "r_y2": 253.74900000000002, "r_x3": 429.818, "r_y3": 253.74900000000002, "coord_origin": "TOPLEFT"}, "text": "0.1", "orig": "0.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 89, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 466.436, "r_y0": 258.731, "r_x1": 482.548, "r_y1": 258.731, "r_x2": 482.548, "r_y2": 253.74900000000002, "r_x3": 466.436, "r_y3": 253.74900000000002, "coord_origin": "TOPLEFT"}, "text": "117.44", "orig": "117.44", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 90, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 514.291, "r_y0": 258.731, "r_x1": 530.81, "r_y1": 258.731, "r_x2": 530.81, "r_y2": 253.74900000000002, "r_x3": 514.291, "r_y3": 253.74900000000002, "coord_origin": "TOPLEFT"}, "text": "122.41", "orig": "122.41", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 91, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 306.115, "r_y0": 266.595, "r_x1": 322.629, "r_y1": 266.595, "r_x2": 322.629, "r_y2": 261.61300000000006, "r_x3": 306.115, "r_y3": 261.61300000000006, "coord_origin": "TOPLEFT"}, "text": "Vested", "orig": "Vested", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 92, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.432, "r_y0": 266.595, "r_x1": 405.536, "r_y1": 266.595, "r_x2": 405.536, "r_y2": 261.61300000000006, "r_x3": 394.432, "r_y3": 261.61300000000006, "coord_origin": "TOPLEFT"}, "text": "(0.5)", "orig": "(0.5)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 93, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 427.702, "r_y0": 266.595, "r_x1": 438.806, "r_y1": 266.595, "r_x2": 438.806, "r_y2": 261.61300000000006, "r_x3": 427.702, "r_y3": 261.61300000000006, "coord_origin": "TOPLEFT"}, "text": "(0.1)", "orig": "(0.1)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 94, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 468.555, "r_y0": 266.595, "r_x1": 482.07, "r_y1": 266.595, "r_x2": 482.07, "r_y2": 261.61300000000006, "r_x3": 468.555, "r_y3": 261.61300000000006, "coord_origin": "TOPLEFT"}, "text": "87.08", "orig": "87.08", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 95, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 516.019, "r_y0": 266.595, "r_x1": 529.534, "r_y1": 266.595, "r_x2": 529.534, "r_y2": 261.61300000000006, "r_x3": 516.019, "r_y3": 261.61300000000006, "coord_origin": "TOPLEFT"}, "text": "81.14", "orig": "81.14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 96, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 306.115, "r_y0": 274.688, "r_x1": 356.248, "r_y1": 274.688, "r_x2": 356.248, "r_y2": 269.706, "r_x3": 306.115, "r_y3": 269.706, "coord_origin": "TOPLEFT"}, "text": "Canceled or forfeited", "orig": "Canceled or forfeited", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 97, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.432, "r_y0": 275.366, "r_x1": 405.536, "r_y1": 275.366, "r_x2": 405.536, "r_y2": 270.384, "r_x3": 394.432, "r_y3": 270.384, "coord_origin": "TOPLEFT"}, "text": "(0.1)", "orig": "(0.1)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 98, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 431.028, "r_y0": 275.366, "r_x1": 436.428, "r_y1": 275.366, "r_x2": 436.428, "r_y2": 270.384, "r_x3": 431.028, "r_y3": 270.384, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 99, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 465.831, "r_y0": 275.366, "r_x1": 482.35, "r_y1": 275.366, "r_x2": 482.35, "r_y2": 270.384, "r_x3": 465.831, "r_y3": 270.384, "coord_origin": "TOPLEFT"}, "text": "102.01", "orig": "102.01", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 100, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 516.019, "r_y0": 275.366, "r_x1": 529.534, "r_y1": 275.366, "r_x2": 529.534, "r_y2": 270.384, "r_x3": 516.019, "r_y3": 270.384, "coord_origin": "TOPLEFT"}, "text": "92.18", "orig": "92.18", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 101, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 306.115, "r_y0": 283.532, "r_x1": 373.358, "r_y1": 283.532, "r_x2": 373.358, "r_y2": 278.55100000000004, "r_x3": 306.115, "r_y3": 278.55100000000004, "coord_origin": "TOPLEFT"}, "text": "Nonvested on December 31", "orig": "Nonvested on December 31", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 102, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 396.247, "r_y0": 283.532, "r_x1": 403.755, "r_y1": 283.532, "r_x2": 403.755, "r_y2": 278.55100000000004, "r_x3": 396.247, "r_y3": 278.55100000000004, "coord_origin": "TOPLEFT"}, "text": "1.0", "orig": "1.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 103, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 429.516, "r_y0": 283.532, "r_x1": 437.025, "r_y1": 283.532, "r_x2": 437.025, "r_y2": 278.55100000000004, "r_x3": 429.516, "r_y3": 278.55100000000004, "coord_origin": "TOPLEFT"}, "text": "0.3", "orig": "0.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 104, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 463.714, "r_y0": 283.532, "r_x1": 484.74, "r_y1": 283.532, "r_x2": 484.74, "r_y2": 278.55100000000004, "r_x3": 463.714, "r_y3": 278.55100000000004, "coord_origin": "TOPLEFT"}, "text": "104.85 $", "orig": "104.85 $", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 105, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 512.995, "r_y0": 283.532, "r_x1": 534.02, "r_y1": 283.532, "r_x2": 534.02, "r_y2": 278.55100000000004, "r_x3": 512.995, "r_y3": 278.55100000000004, "coord_origin": "TOPLEFT"}, "text": "$ 104.51", "orig": "$ 104.51", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": [{"id": 124, "label": "text", "bbox": {"l": 459.049, "t": 221.68899999999996, "r": 542.0, "b": 226.67100000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 74, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 459.049, "r_y0": 226.67100000000005, "r_x1": 542.0, "r_y1": 226.67100000000005, "r_x2": 542.0, "r_y2": 221.68899999999996, "r_x3": 459.049, "r_y3": 221.68899999999996, "coord_origin": "TOPLEFT"}, "text": "Weighted Average Grant Date Fair", "orig": "Weighted Average Grant Date Fair", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 125, "label": "text", "bbox": {"l": 493.822, "t": 227.899, "r": 507.226, "b": 232.88099999999997, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 75, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 493.822, "r_y0": 232.88099999999997, "r_x1": 507.226, "r_y1": 232.88099999999997, "r_x2": 507.226, "r_y2": 227.899, "r_x3": 493.822, "r_y3": 227.899, "coord_origin": "TOPLEFT"}, "text": "Value", "orig": "Value", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 126, "label": "text", "bbox": {"l": 393.244, "t": 236.812, "r": 407.346, "b": 241.79399999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 76, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 393.244, "r_y0": 241.79399999999998, "r_x1": 407.346, "r_y1": 241.79399999999998, "r_x2": 407.346, "r_y2": 236.812, "r_x3": 393.244, "r_y3": 236.812, "coord_origin": "TOPLEFT"}, "text": "RSUs", "orig": "RSUs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 127, "label": "text", "bbox": {"l": 392.097, "t": 221.639, "r": 438.015, "b": 226.62099999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 77, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 392.097, "r_y0": 226.62099999999998, "r_x1": 438.015, "r_y1": 226.62099999999998, "r_x2": 438.015, "r_y2": 221.639, "r_x3": 392.097, "r_y3": 221.639, "coord_origin": "TOPLEFT"}, "text": "Shares (in millions)", "orig": "Shares (in millions)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 128, "label": "text", "bbox": {"l": 427.183, "t": 236.812, "r": 440.988, "b": 241.79399999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 78, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 427.183, "r_y0": 241.79399999999998, "r_x1": 440.988, "r_y1": 241.79399999999998, "r_x2": 440.988, "r_y2": 236.812, "r_x3": 427.183, "r_y3": 236.812, "coord_origin": "TOPLEFT"}, "text": "PSUs", "orig": "PSUs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 129, "label": "text", "bbox": {"l": 468.383, "t": 236.812, "r": 482.485, "b": 241.79399999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 79, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 468.383, "r_y0": 241.79399999999998, "r_x1": 482.485, "r_y1": 241.79399999999998, "r_x2": 482.485, "r_y2": 236.812, "r_x3": 468.383, "r_y3": 236.812, "coord_origin": "TOPLEFT"}, "text": "RSUs", "orig": "RSUs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 130, "label": "text", "bbox": {"l": 516.926, "t": 236.812, "r": 530.73, "b": 241.79399999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 80, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 516.926, "r_y0": 241.79399999999998, "r_x1": 530.73, "r_y1": 241.79399999999998, "r_x2": 530.73, "r_y2": 236.812, "r_x3": 516.926, "r_y3": 236.812, "coord_origin": "TOPLEFT"}, "text": "PSUs", "orig": "PSUs", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 131, "label": "text", "bbox": {"l": 306.115, "t": 244.67600000000004, "r": 364.656, "b": 249.65700000000004, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 81, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 306.115, "r_y0": 249.65700000000004, "r_x1": 364.656, "r_y1": 249.65700000000004, "r_x2": 364.656, "r_y2": 244.67600000000004, "r_x3": 306.115, "r_y3": 244.67600000000004, "coord_origin": "TOPLEFT"}, "text": "Nonvested on January 1", "orig": "Nonvested on January 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 132, "label": "text", "bbox": {"l": 396.247, "t": 244.97799999999995, "r": 403.755, "b": 249.96000000000004, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 82, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 396.247, "r_y0": 249.96000000000004, "r_x1": 403.755, "r_y1": 249.96000000000004, "r_x2": 403.755, "r_y2": 244.97799999999995, "r_x3": 396.247, "r_y3": 244.97799999999995, "coord_origin": "TOPLEFT"}, "text": "1.1", "orig": "1.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 133, "label": "text", "bbox": {"l": 429.818, "t": 244.97799999999995, "r": 437.327, "b": 249.96000000000004, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 83, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 429.818, "r_y0": 249.96000000000004, "r_x1": 437.327, "r_y1": 249.96000000000004, "r_x2": 437.327, "r_y2": 244.97799999999995, "r_x3": 429.818, "r_y3": 244.97799999999995, "coord_origin": "TOPLEFT"}, "text": "0.3", "orig": "0.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 134, "label": "text", "bbox": {"l": 465.529, "t": 244.97799999999995, "r": 483.55, "b": 249.96000000000004, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 84, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 465.529, "r_y0": 249.96000000000004, "r_x1": 483.55, "r_y1": 249.96000000000004, "r_x2": 483.55, "r_y2": 244.97799999999995, "r_x3": 465.529, "r_y3": 244.97799999999995, "coord_origin": "TOPLEFT"}, "text": "90.10 $", "orig": "90.10 $", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 135, "label": "text", "bbox": {"l": 513.448, "t": 244.97799999999995, "r": 531.47, "b": 249.96000000000004, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 85, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 513.448, "r_y0": 249.96000000000004, "r_x1": 531.47, "r_y1": 249.96000000000004, "r_x2": 531.47, "r_y2": 244.97799999999995, "r_x3": 513.448, "r_y3": 244.97799999999995, "coord_origin": "TOPLEFT"}, "text": "$ 91.19", "orig": "$ 91.19", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 136, "label": "text", "bbox": {"l": 306.115, "t": 253.74900000000002, "r": 325.627, "b": 258.731, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 86, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 306.115, "r_y0": 258.731, "r_x1": 325.627, "r_y1": 258.731, "r_x2": 325.627, "r_y2": 253.74900000000002, "r_x3": 306.115, "r_y3": 253.74900000000002, "coord_origin": "TOPLEFT"}, "text": "Granted", "orig": "Granted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 137, "label": "text", "bbox": {"l": 396.247, "t": 253.74900000000002, "r": 403.755, "b": 258.731, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 87, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 396.247, "r_y0": 258.731, "r_x1": 403.755, "r_y1": 258.731, "r_x2": 403.755, "r_y2": 253.74900000000002, "r_x3": 396.247, "r_y3": 253.74900000000002, "coord_origin": "TOPLEFT"}, "text": "0.5", "orig": "0.5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 138, "label": "text", "bbox": {"l": 429.818, "t": 253.74900000000002, "r": 437.327, "b": 258.731, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 88, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 429.818, "r_y0": 258.731, "r_x1": 437.327, "r_y1": 258.731, "r_x2": 437.327, "r_y2": 253.74900000000002, "r_x3": 429.818, "r_y3": 253.74900000000002, "coord_origin": "TOPLEFT"}, "text": "0.1", "orig": "0.1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 139, "label": "text", "bbox": {"l": 466.436, "t": 253.74900000000002, "r": 482.548, "b": 258.731, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 89, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 466.436, "r_y0": 258.731, "r_x1": 482.548, "r_y1": 258.731, "r_x2": 482.548, "r_y2": 253.74900000000002, "r_x3": 466.436, "r_y3": 253.74900000000002, "coord_origin": "TOPLEFT"}, "text": "117.44", "orig": "117.44", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 140, "label": "text", "bbox": {"l": 514.291, "t": 253.74900000000002, "r": 530.81, "b": 258.731, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 90, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 514.291, "r_y0": 258.731, "r_x1": 530.81, "r_y1": 258.731, "r_x2": 530.81, "r_y2": 253.74900000000002, "r_x3": 514.291, "r_y3": 253.74900000000002, "coord_origin": "TOPLEFT"}, "text": "122.41", "orig": "122.41", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 141, "label": "text", "bbox": {"l": 306.115, "t": 261.61300000000006, "r": 322.629, "b": 266.595, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 91, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 306.115, "r_y0": 266.595, "r_x1": 322.629, "r_y1": 266.595, "r_x2": 322.629, "r_y2": 261.61300000000006, "r_x3": 306.115, "r_y3": 261.61300000000006, "coord_origin": "TOPLEFT"}, "text": "Vested", "orig": "Vested", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 142, "label": "text", "bbox": {"l": 394.432, "t": 261.61300000000006, "r": 405.536, "b": 266.595, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 92, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.432, "r_y0": 266.595, "r_x1": 405.536, "r_y1": 266.595, "r_x2": 405.536, "r_y2": 261.61300000000006, "r_x3": 394.432, "r_y3": 261.61300000000006, "coord_origin": "TOPLEFT"}, "text": "(0.5)", "orig": "(0.5)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 143, "label": "text", "bbox": {"l": 427.702, "t": 261.61300000000006, "r": 438.806, "b": 266.595, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 93, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 427.702, "r_y0": 266.595, "r_x1": 438.806, "r_y1": 266.595, "r_x2": 438.806, "r_y2": 261.61300000000006, "r_x3": 427.702, "r_y3": 261.61300000000006, "coord_origin": "TOPLEFT"}, "text": "(0.1)", "orig": "(0.1)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 144, "label": "text", "bbox": {"l": 468.555, "t": 261.61300000000006, "r": 482.07, "b": 266.595, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 94, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 468.555, "r_y0": 266.595, "r_x1": 482.07, "r_y1": 266.595, "r_x2": 482.07, "r_y2": 261.61300000000006, "r_x3": 468.555, "r_y3": 261.61300000000006, "coord_origin": "TOPLEFT"}, "text": "87.08", "orig": "87.08", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 145, "label": "text", "bbox": {"l": 516.019, "t": 261.61300000000006, "r": 529.534, "b": 266.595, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 95, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 516.019, "r_y0": 266.595, "r_x1": 529.534, "r_y1": 266.595, "r_x2": 529.534, "r_y2": 261.61300000000006, "r_x3": 516.019, "r_y3": 261.61300000000006, "coord_origin": "TOPLEFT"}, "text": "81.14", "orig": "81.14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 146, "label": "text", "bbox": {"l": 306.115, "t": 269.706, "r": 356.248, "b": 274.688, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 96, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 306.115, "r_y0": 274.688, "r_x1": 356.248, "r_y1": 274.688, "r_x2": 356.248, "r_y2": 269.706, "r_x3": 306.115, "r_y3": 269.706, "coord_origin": "TOPLEFT"}, "text": "Canceled or forfeited", "orig": "Canceled or forfeited", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 147, "label": "text", "bbox": {"l": 394.432, "t": 270.384, "r": 405.536, "b": 275.366, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 97, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 394.432, "r_y0": 275.366, "r_x1": 405.536, "r_y1": 275.366, "r_x2": 405.536, "r_y2": 270.384, "r_x3": 394.432, "r_y3": 270.384, "coord_origin": "TOPLEFT"}, "text": "(0.1)", "orig": "(0.1)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 148, "label": "text", "bbox": {"l": 431.028, "t": 270.384, "r": 436.428, "b": 275.366, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 98, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 431.028, "r_y0": 275.366, "r_x1": 436.428, "r_y1": 275.366, "r_x2": 436.428, "r_y2": 270.384, "r_x3": 431.028, "r_y3": 270.384, "coord_origin": "TOPLEFT"}, "text": "-", "orig": "-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 149, "label": "text", "bbox": {"l": 465.831, "t": 270.384, "r": 482.35, "b": 275.366, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 99, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 465.831, "r_y0": 275.366, "r_x1": 482.35, "r_y1": 275.366, "r_x2": 482.35, "r_y2": 270.384, "r_x3": 465.831, "r_y3": 270.384, "coord_origin": "TOPLEFT"}, "text": "102.01", "orig": "102.01", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 150, "label": "text", "bbox": {"l": 516.019, "t": 270.384, "r": 529.534, "b": 275.366, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 100, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 516.019, "r_y0": 275.366, "r_x1": 529.534, "r_y1": 275.366, "r_x2": 529.534, "r_y2": 270.384, "r_x3": 516.019, "r_y3": 270.384, "coord_origin": "TOPLEFT"}, "text": "92.18", "orig": "92.18", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 151, "label": "text", "bbox": {"l": 306.115, "t": 278.55100000000004, "r": 373.358, "b": 283.532, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 101, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 306.115, "r_y0": 283.532, "r_x1": 373.358, "r_y1": 283.532, "r_x2": 373.358, "r_y2": 278.55100000000004, "r_x3": 306.115, "r_y3": 278.55100000000004, "coord_origin": "TOPLEFT"}, "text": "Nonvested on December 31", "orig": "Nonvested on December 31", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 152, "label": "text", "bbox": {"l": 396.247, "t": 278.55100000000004, "r": 403.755, "b": 283.532, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 102, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 396.247, "r_y0": 283.532, "r_x1": 403.755, "r_y1": 283.532, "r_x2": 403.755, "r_y2": 278.55100000000004, "r_x3": 396.247, "r_y3": 278.55100000000004, "coord_origin": "TOPLEFT"}, "text": "1.0", "orig": "1.0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 153, "label": "text", "bbox": {"l": 429.516, "t": 278.55100000000004, "r": 437.025, "b": 283.532, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 103, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 429.516, "r_y0": 283.532, "r_x1": 437.025, "r_y1": 283.532, "r_x2": 437.025, "r_y2": 278.55100000000004, "r_x3": 429.516, "r_y3": 278.55100000000004, "coord_origin": "TOPLEFT"}, "text": "0.3", "orig": "0.3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 154, "label": "text", "bbox": {"l": 463.714, "t": 278.55100000000004, "r": 484.74, "b": 283.532, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 104, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 463.714, "r_y0": 283.532, "r_x1": 484.74, "r_y1": 283.532, "r_x2": 484.74, "r_y2": 278.55100000000004, "r_x3": 463.714, "r_y3": 278.55100000000004, "coord_origin": "TOPLEFT"}, "text": "104.85 $", "orig": "104.85 $", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 155, "label": "text", "bbox": {"l": 512.995, "t": 278.55100000000004, "r": 534.02, "b": 283.532, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 105, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 512.995, "r_y0": 283.532, "r_x1": 534.02, "r_y1": 283.532, "r_x2": 534.02, "r_y2": 278.55100000000004, "r_x3": 512.995, "r_y3": 278.55100000000004, "coord_origin": "TOPLEFT"}, "text": "$ 104.51", "orig": "$ 104.51", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}]}, "text": null, "otsl_seq": ["ecel", "ched", "lcel", "ched", "lcel", "nl", "ecel", "ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 7, "num_cols": 5, "table_cells": [{"bbox": {"l": 459.049, "t": 221.68899999999996, "r": 542.0, "b": 232.88099999999997, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 2, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 3, "end_col_offset_idx": 5, "text": "Weighted Average Grant Date Fair Value", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 393.244, "t": 236.812, "r": 407.346, "b": 241.79399999999998, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "RSUs", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 392.097, "t": 221.639, "r": 438.015, "b": 226.62099999999998, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 2, "start_row_offset_idx": 0, "end_row_offset_idx": 1, "start_col_offset_idx": 1, "end_col_offset_idx": 3, "text": "Shares (in millions)", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 427.183, "t": 236.812, "r": 440.988, "b": 241.79399999999998, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "PSUs", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 468.383, "t": 236.812, "r": 482.485, "b": 241.79399999999998, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "RSUs", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 516.926, "t": 236.812, "r": 530.73, "b": 241.79399999999998, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 1, "end_row_offset_idx": 2, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "PSUs", "column_header": true, "row_header": false, "row_section": false}, {"bbox": {"l": 306.115, "t": 244.67600000000004, "r": 364.656, "b": 249.65700000000004, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Nonvested on January 1", "column_header": false, "row_header": true, "row_section": false}, {"bbox": {"l": 396.247, "t": 244.97799999999995, "r": 403.755, "b": 249.96000000000004, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "1.1", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 429.818, "t": 244.97799999999995, "r": 437.327, "b": 249.96000000000004, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "0.3", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 465.529, "t": 244.97799999999995, "r": 483.55, "b": 249.96000000000004, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "90.10 $", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 513.448, "t": 244.97799999999995, "r": 531.47, "b": 249.96000000000004, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 2, "end_row_offset_idx": 3, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "$ 91.19", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 306.115, "t": 253.74900000000002, "r": 325.627, "b": 258.731, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Granted", "column_header": false, "row_header": true, "row_section": false}, {"bbox": {"l": 396.247, "t": 253.74900000000002, "r": 403.755, "b": 258.731, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "0.5", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 429.818, "t": 253.74900000000002, "r": 437.327, "b": 258.731, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "0.1", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 466.436, "t": 253.74900000000002, "r": 482.548, "b": 258.731, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "117.44", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 514.291, "t": 253.74900000000002, "r": 530.81, "b": 258.731, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 3, "end_row_offset_idx": 4, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "122.41", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 306.115, "t": 261.61300000000006, "r": 322.629, "b": 266.595, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Vested", "column_header": false, "row_header": true, "row_section": false}, {"bbox": {"l": 394.432, "t": 261.61300000000006, "r": 405.536, "b": 266.595, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "(0.5)", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 427.702, "t": 261.61300000000006, "r": 438.806, "b": 266.595, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "(0.1)", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 468.555, "t": 261.61300000000006, "r": 482.07, "b": 266.595, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "87.08", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 516.019, "t": 261.61300000000006, "r": 529.534, "b": 266.595, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 4, "end_row_offset_idx": 5, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "81.14", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 306.115, "t": 269.706, "r": 356.248, "b": 274.688, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Canceled or forfeited", "column_header": false, "row_header": true, "row_section": false}, {"bbox": {"l": 394.432, "t": 270.384, "r": 405.536, "b": 275.366, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "(0.1)", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 431.028, "t": 270.384, "r": 436.428, "b": 275.366, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "-", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 465.831, "t": 270.384, "r": 482.35, "b": 275.366, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "102.01", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 516.019, "t": 270.384, "r": 529.534, "b": 275.366, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 5, "end_row_offset_idx": 6, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "92.18", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 306.115, "t": 278.55100000000004, "r": 373.358, "b": 283.532, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 0, "end_col_offset_idx": 1, "text": "Nonvested on December 31", "column_header": false, "row_header": true, "row_section": false}, {"bbox": {"l": 396.247, "t": 278.55100000000004, "r": 403.755, "b": 283.532, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 1, "end_col_offset_idx": 2, "text": "1.0", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 429.516, "t": 278.55100000000004, "r": 437.025, "b": 283.532, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 2, "end_col_offset_idx": 3, "text": "0.3", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 463.714, "t": 278.55100000000004, "r": 484.74, "b": 283.532, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 3, "end_col_offset_idx": 4, "text": "104.85 $", "column_header": false, "row_header": false, "row_section": false}, {"bbox": {"l": 512.995, "t": 278.55100000000004, "r": 534.02, "b": 283.532, "coord_origin": "TOPLEFT"}, "row_span": 1, "col_span": 1, "start_row_offset_idx": 6, "end_row_offset_idx": 7, "start_col_offset_idx": 4, "end_col_offset_idx": 5, "text": "$ 104.51", "column_header": false, "row_header": false, "row_section": false}]}, {"label": "caption", "id": 6, "page_no": 7, "cluster": {"id": 6, "label": "caption", "bbox": {"l": 50.112, "t": 321.146, "r": 545.114, "b": 365.564, "coord_origin": "TOPLEFT"}, "confidence": 0.9140303134918213, "cells": [{"index": 106, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 329.698, "r_x1": 86.864, "r_y1": 329.698, "r_x2": 86.864, "r_y2": 321.146, "r_x3": 50.112, "r_y3": 321.146, "coord_origin": "TOPLEFT"}, "text": "Figure 5:", "orig": "Figure 5:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 107, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 93.918, "r_y0": 329.698, "r_x1": 545.114, "r_y1": 329.698, "r_x2": 545.114, "r_y2": 321.146, "r_x3": 93.918, "r_y3": 321.146, "coord_origin": "TOPLEFT"}, "text": "One of the benefits of TableFormer is that it is language agnostic, as an example, the left part of the illustration", "orig": "One of the benefits of TableFormer is that it is language agnostic, as an example, the left part of the illustration", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 108, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 341.653, "r_x1": 545.114, "r_y1": 341.653, "r_x2": 545.114, "r_y2": 333.101, "r_x3": 50.112, "r_y3": 333.101, "coord_origin": "TOPLEFT"}, "text": "demonstrates TableFormer predictions on previously unseen language (Japanese). Additionally, we see that TableFormer is", "orig": "demonstrates TableFormer predictions on previously unseen language (Japanese). Additionally, we see that TableFormer is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 109, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 353.608, "r_x1": 545.114, "r_y1": 353.608, "r_x2": 545.114, "r_y2": 345.056, "r_x3": 50.112, "r_y3": 345.056, "coord_origin": "TOPLEFT"}, "text": "robust to variability in style and content, right side of the illustration shows the example of the TableFormer prediction from", "orig": "robust to variability in style and content, right side of the illustration shows the example of the TableFormer prediction from", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 110, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 365.564, "r_x1": 139.795, "r_y1": 365.564, "r_x2": 139.795, "r_y2": 357.012, "r_x3": 50.112, "r_y3": 357.012, "coord_origin": "TOPLEFT"}, "text": "the FinTabNet dataset.", "orig": "the FinTabNet dataset.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Figure 5: One of the benefits of TableFormer is that it is language agnostic, as an example, the left part of the illustration demonstrates TableFormer predictions on previously unseen language (Japanese). Additionally, we see that TableFormer is robust to variability in style and content, right side of the illustration shows the example of the TableFormer prediction from the FinTabNet dataset."}, {"label": "picture", "id": 12, "page_no": 7, "cluster": {"id": 12, "label": "picture", "bbox": {"l": 216.76925659179688, "t": 380.4906311035156, "r": 375.7829284667969, "b": 443.34698486328125, "coord_origin": "TOPLEFT"}, "confidence": 0.805853009223938, "cells": [{"index": 111, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 220.263, "r_y0": 386.393, "r_x1": 342.078, "r_y1": 386.393, "r_x2": 342.078, "r_y2": 381.96, "r_x3": 220.263, "r_y3": 381.96, "coord_origin": "TOPLEFT"}, "text": "Red - PDF cells, Green - predicted bounding boxes", "orig": "Red - PDF cells, Green - predicted bounding boxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": [{"id": 156, "label": "text", "bbox": {"l": 220.263, "t": 381.96, "r": 342.078, "b": 386.393, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 111, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 220.263, "r_y0": 386.393, "r_x1": 342.078, "r_y1": 386.393, "r_x2": 342.078, "r_y2": 381.96, "r_x3": 220.263, "r_y3": 381.96, "coord_origin": "TOPLEFT"}, "text": "Red - PDF cells, Green - predicted bounding boxes", "orig": "Red - PDF cells, Green - predicted bounding boxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}]}, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null}, {"label": "picture", "id": 11, "page_no": 7, "cluster": {"id": 11, "label": "picture", "bbox": {"l": 51.736167907714844, "t": 380.48065185546875, "r": 211.83778381347656, "b": 443.6580810546875, "coord_origin": "TOPLEFT"}, "confidence": 0.8308426737785339, "cells": [{"index": 112, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 53.715, "r_y0": 386.393, "r_x1": 85.657, "r_y1": 386.393, "r_x2": 85.657, "r_y2": 381.96, "r_x3": 53.715, "r_y3": 381.96, "coord_origin": "TOPLEFT"}, "text": "Ground Truth", "orig": "Ground Truth", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": [{"id": 157, "label": "text", "bbox": {"l": 53.715, "t": 381.96, "r": 85.657, "b": 386.393, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 112, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 53.715, "r_y0": 386.393, "r_x1": 85.657, "r_y1": 386.393, "r_x2": 85.657, "r_y2": 381.96, "r_x3": 53.715, "r_y3": 381.96, "coord_origin": "TOPLEFT"}, "text": "Ground Truth", "orig": "Ground Truth", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}]}, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null}, {"label": "picture", "id": 13, "page_no": 7, "cluster": {"id": 13, "label": "picture", "bbox": {"l": 383.1364440917969, "t": 381.2313232421875, "r": 542.1132202148438, "b": 442.7749328613281, "coord_origin": "TOPLEFT"}, "confidence": 0.7881615161895752, "cells": [{"index": 113, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 437.379, "r_y0": 406.686, "r_x1": 443.699, "r_y1": 406.686, "r_x2": 443.699, "r_y2": 401.109, "r_x3": 437.379, "r_y3": 401.109, "coord_origin": "TOPLEFT"}, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 114, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 450.332, "r_y0": 406.686, "r_x1": 456.651, "r_y1": 406.686, "r_x2": 456.651, "r_y2": 401.109, "r_x3": 450.332, "r_y3": 401.109, "coord_origin": "TOPLEFT"}, "text": "17", "orig": "17", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 115, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 463.285, "r_y0": 406.686, "r_x1": 469.604, "r_y1": 406.686, "r_x2": 469.604, "r_y2": 401.109, "r_x3": 463.285, "r_y3": 401.109, "coord_origin": "TOPLEFT"}, "text": "18", "orig": "18", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 116, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 476.237, "r_y0": 406.686, "r_x1": 482.557, "r_y1": 406.686, "r_x2": 482.557, "r_y2": 401.109, "r_x3": 476.237, "r_y3": 401.109, "coord_origin": "TOPLEFT"}, "text": "19", "orig": "19", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 117, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 489.19, "r_y0": 406.686, "r_x1": 495.509, "r_y1": 406.686, "r_x2": 495.509, "r_y2": 401.109, "r_x3": 489.19, "r_y3": 401.109, "coord_origin": "TOPLEFT"}, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 118, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 502.143, "r_y0": 406.686, "r_x1": 508.462, "r_y1": 406.686, "r_x2": 508.462, "r_y2": 401.109, "r_x3": 502.143, "r_y3": 401.109, "coord_origin": "TOPLEFT"}, "text": "21", "orig": "21", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 119, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 515.095, "r_y0": 406.686, "r_x1": 521.414, "r_y1": 406.686, "r_x2": 521.414, "r_y2": 401.109, "r_x3": 515.095, "r_y3": 401.109, "coord_origin": "TOPLEFT"}, "text": "22", "orig": "22", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 120, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 385.281, "r_y0": 417.172, "r_x1": 391.601, "r_y1": 417.172, "r_x2": 391.601, "r_y2": 411.594, "r_x3": 385.281, "r_y3": 411.594, "coord_origin": "TOPLEFT"}, "text": "23", "orig": "23", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 121, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 398.523, "r_y0": 417.172, "r_x1": 404.843, "r_y1": 417.172, "r_x2": 404.843, "r_y2": 411.594, "r_x3": 398.523, "r_y3": 411.594, "coord_origin": "TOPLEFT"}, "text": "24", "orig": "24", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 122, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 411.476, "r_y0": 417.172, "r_x1": 417.795, "r_y1": 417.172, "r_x2": 417.795, "r_y2": 411.594, "r_x3": 411.476, "r_y3": 411.594, "coord_origin": "TOPLEFT"}, "text": "25", "orig": "25", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 123, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 437.379, "r_y0": 417.172, "r_x1": 443.699, "r_y1": 417.172, "r_x2": 443.699, "r_y2": 411.594, "r_x3": 437.379, "r_y3": 411.594, "coord_origin": "TOPLEFT"}, "text": "26", "orig": "26", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 124, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 450.332, "r_y0": 417.172, "r_x1": 456.651, "r_y1": 417.172, "r_x2": 456.651, "r_y2": 411.594, "r_x3": 450.332, "r_y3": 411.594, "coord_origin": "TOPLEFT"}, "text": "27", "orig": "27", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 125, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 463.285, "r_y0": 417.172, "r_x1": 469.604, "r_y1": 417.172, "r_x2": 469.604, "r_y2": 411.594, "r_x3": 463.285, "r_y3": 411.594, "coord_origin": "TOPLEFT"}, "text": "28", "orig": "28", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 126, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 385.281, "r_y0": 427.203, "r_x1": 391.601, "r_y1": 427.203, "r_x2": 391.601, "r_y2": 421.626, "r_x3": 385.281, "r_y3": 421.626, "coord_origin": "TOPLEFT"}, "text": "30", "orig": "30", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 127, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 398.523, "r_y0": 427.203, "r_x1": 404.843, "r_y1": 427.203, "r_x2": 404.843, "r_y2": 421.626, "r_x3": 398.523, "r_y3": 421.626, "coord_origin": "TOPLEFT"}, "text": "31", "orig": "31", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 128, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 411.476, "r_y0": 427.203, "r_x1": 417.795, "r_y1": 427.203, "r_x2": 417.795, "r_y2": 421.626, "r_x3": 411.476, "r_y3": 421.626, "coord_origin": "TOPLEFT"}, "text": "32", "orig": "32", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 129, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 424.429, "r_y0": 427.203, "r_x1": 430.748, "r_y1": 427.203, "r_x2": 430.748, "r_y2": 421.626, "r_x3": 424.429, "r_y3": 421.626, "coord_origin": "TOPLEFT"}, "text": "33", "orig": "33", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 130, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 437.381, "r_y0": 427.203, "r_x1": 443.701, "r_y1": 427.203, "r_x2": 443.701, "r_y2": 421.626, "r_x3": 437.381, "r_y3": 421.626, "coord_origin": "TOPLEFT"}, "text": "34", "orig": "34", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 131, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 450.334, "r_y0": 427.203, "r_x1": 456.653, "r_y1": 427.203, "r_x2": 456.653, "r_y2": 421.626, "r_x3": 450.334, "r_y3": 421.626, "coord_origin": "TOPLEFT"}, "text": "35", "orig": "35", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 132, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 463.287, "r_y0": 427.203, "r_x1": 469.606, "r_y1": 427.203, "r_x2": 469.606, "r_y2": 421.626, "r_x3": 463.287, "r_y3": 421.626, "coord_origin": "TOPLEFT"}, "text": "36", "orig": "36", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 133, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 476.239, "r_y0": 427.203, "r_x1": 482.558, "r_y1": 427.203, "r_x2": 482.558, "r_y2": 421.626, "r_x3": 476.239, "r_y3": 421.626, "coord_origin": "TOPLEFT"}, "text": "37", "orig": "37", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 134, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 489.192, "r_y0": 427.203, "r_x1": 495.511, "r_y1": 427.203, "r_x2": 495.511, "r_y2": 421.626, "r_x3": 489.192, "r_y3": 421.626, "coord_origin": "TOPLEFT"}, "text": "38", "orig": "38", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 135, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 502.144, "r_y0": 427.203, "r_x1": 508.464, "r_y1": 427.203, "r_x2": 508.464, "r_y2": 421.626, "r_x3": 502.144, "r_y3": 421.626, "coord_origin": "TOPLEFT"}, "text": "39", "orig": "39", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 136, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 515.097, "r_y0": 427.203, "r_x1": 521.416, "r_y1": 427.203, "r_x2": 521.416, "r_y2": 421.626, "r_x3": 515.097, "r_y3": 421.626, "coord_origin": "TOPLEFT"}, "text": "40", "orig": "40", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 137, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 528.05, "r_y0": 427.203, "r_x1": 534.369, "r_y1": 427.203, "r_x2": 534.369, "r_y2": 421.626, "r_x3": 528.05, "r_y3": 421.626, "coord_origin": "TOPLEFT"}, "text": "41", "orig": "41", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 138, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 385.281, "r_y0": 438.178, "r_x1": 391.601, "r_y1": 438.178, "r_x2": 391.601, "r_y2": 432.6, "r_x3": 385.281, "r_y3": 432.6, "coord_origin": "TOPLEFT"}, "text": "42", "orig": "42", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 139, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 398.523, "r_y0": 438.178, "r_x1": 404.843, "r_y1": 438.178, "r_x2": 404.843, "r_y2": 432.6, "r_x3": 398.523, "r_y3": 432.6, "coord_origin": "TOPLEFT"}, "text": "43", "orig": "43", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 140, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 411.476, "r_y0": 438.178, "r_x1": 417.795, "r_y1": 438.178, "r_x2": 417.795, "r_y2": 432.6, "r_x3": 411.476, "r_y3": 432.6, "coord_origin": "TOPLEFT"}, "text": "44", "orig": "44", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 141, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 424.429, "r_y0": 438.178, "r_x1": 430.748, "r_y1": 438.178, "r_x2": 430.748, "r_y2": 432.6, "r_x3": 424.429, "r_y3": 432.6, "coord_origin": "TOPLEFT"}, "text": "45", "orig": "45", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 142, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 437.381, "r_y0": 438.178, "r_x1": 443.701, "r_y1": 438.178, "r_x2": 443.701, "r_y2": 432.6, "r_x3": 437.381, "r_y3": 432.6, "coord_origin": "TOPLEFT"}, "text": "46", "orig": "46", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 143, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 450.334, "r_y0": 438.178, "r_x1": 456.653, "r_y1": 438.178, "r_x2": 456.653, "r_y2": 432.6, "r_x3": 450.334, "r_y3": 432.6, "coord_origin": "TOPLEFT"}, "text": "47", "orig": "47", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 144, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 463.287, "r_y0": 438.178, "r_x1": 469.606, "r_y1": 438.178, "r_x2": 469.606, "r_y2": 432.6, "r_x3": 463.287, "r_y3": 432.6, "coord_origin": "TOPLEFT"}, "text": "48", "orig": "48", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 145, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 476.239, "r_y0": 438.178, "r_x1": 482.558, "r_y1": 438.178, "r_x2": 482.558, "r_y2": 432.6, "r_x3": 476.239, "r_y3": 432.6, "coord_origin": "TOPLEFT"}, "text": "49", "orig": "49", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 146, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 489.192, "r_y0": 438.178, "r_x1": 495.511, "r_y1": 438.178, "r_x2": 495.511, "r_y2": 432.6, "r_x3": 489.192, "r_y3": 432.6, "coord_origin": "TOPLEFT"}, "text": "50", "orig": "50", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 147, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 502.144, "r_y0": 438.178, "r_x1": 508.464, "r_y1": 438.178, "r_x2": 508.464, "r_y2": 432.6, "r_x3": 502.144, "r_y3": 432.6, "coord_origin": "TOPLEFT"}, "text": "51", "orig": "51", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 148, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 515.097, "r_y0": 438.178, "r_x1": 521.416, "r_y1": 438.178, "r_x2": 521.416, "r_y2": 432.6, "r_x3": 515.097, "r_y3": 432.6, "coord_origin": "TOPLEFT"}, "text": "52", "orig": "52", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 149, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 528.05, "r_y0": 438.178, "r_x1": 534.369, "r_y1": 438.178, "r_x2": 534.369, "r_y2": 432.6, "r_x3": 528.05, "r_y3": 432.6, "coord_origin": "TOPLEFT"}, "text": "53", "orig": "53", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 150, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 385.281, "r_y0": 395.333, "r_x1": 388.441, "r_y1": 395.333, "r_x2": 388.441, "r_y2": 389.756, "r_x3": 385.281, "r_y3": 389.756, "coord_origin": "TOPLEFT"}, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 151, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 398.523, "r_y0": 395.333, "r_x1": 401.683, "r_y1": 395.333, "r_x2": 401.683, "r_y2": 389.756, "r_x3": 398.523, "r_y3": 389.756, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 152, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 411.475, "r_y0": 395.333, "r_x1": 414.635, "r_y1": 395.333, "r_x2": 414.635, "r_y2": 389.756, "r_x3": 411.475, "r_y3": 389.756, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 153, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 424.427, "r_y0": 395.333, "r_x1": 427.587, "r_y1": 395.333, "r_x2": 427.587, "r_y2": 389.756, "r_x3": 424.427, "r_y3": 389.756, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 154, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 437.379, "r_y0": 395.333, "r_x1": 440.539, "r_y1": 395.333, "r_x2": 440.539, "r_y2": 389.756, "r_x3": 437.379, "r_y3": 389.756, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 155, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 450.331, "r_y0": 395.333, "r_x1": 453.491, "r_y1": 395.333, "r_x2": 453.491, "r_y2": 389.756, "r_x3": 450.331, "r_y3": 389.756, "coord_origin": "TOPLEFT"}, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 156, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 463.283, "r_y0": 395.333, "r_x1": 466.443, "r_y1": 395.333, "r_x2": 466.443, "r_y2": 389.756, "r_x3": 463.283, "r_y3": 389.756, "coord_origin": "TOPLEFT"}, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 157, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 476.235, "r_y0": 395.333, "r_x1": 479.395, "r_y1": 395.333, "r_x2": 479.395, "r_y2": 389.756, "r_x3": 476.235, "r_y3": 389.756, "coord_origin": "TOPLEFT"}, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 158, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 489.187, "r_y0": 395.333, "r_x1": 492.347, "r_y1": 395.333, "r_x2": 492.347, "r_y2": 389.756, "r_x3": 489.187, "r_y3": 389.756, "coord_origin": "TOPLEFT"}, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 159, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 502.139, "r_y0": 395.333, "r_x1": 505.299, "r_y1": 395.333, "r_x2": 505.299, "r_y2": 389.756, "r_x3": 502.139, "r_y3": 389.756, "coord_origin": "TOPLEFT"}, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 160, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 515.091, "r_y0": 395.333, "r_x1": 521.411, "r_y1": 395.333, "r_x2": 521.411, "r_y2": 389.756, "r_x3": 515.091, "r_y3": 389.756, "coord_origin": "TOPLEFT"}, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 161, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 528.044, "r_y0": 395.333, "r_x1": 534.131, "r_y1": 395.333, "r_x2": 534.131, "r_y2": 389.756, "r_x3": 528.044, "r_y3": 389.756, "coord_origin": "TOPLEFT"}, "text": "11", "orig": "11", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 162, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 385.281, "r_y0": 405.108, "r_x1": 391.601, "r_y1": 405.108, "r_x2": 391.601, "r_y2": 399.531, "r_x3": 385.281, "r_y3": 399.531, "coord_origin": "TOPLEFT"}, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 163, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 398.523, "r_y0": 405.108, "r_x1": 404.843, "r_y1": 405.108, "r_x2": 404.843, "r_y2": 399.531, "r_x3": 398.523, "r_y3": 399.531, "coord_origin": "TOPLEFT"}, "text": "13", "orig": "13", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 164, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 411.476, "r_y0": 405.108, "r_x1": 417.795, "r_y1": 405.108, "r_x2": 417.795, "r_y2": 399.531, "r_x3": 411.476, "r_y3": 399.531, "coord_origin": "TOPLEFT"}, "text": "14", "orig": "14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 165, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 424.427, "r_y0": 412.908, "r_x1": 430.746, "r_y1": 412.908, "r_x2": 430.746, "r_y2": 407.331, "r_x3": 424.427, "r_y3": 407.331, "coord_origin": "TOPLEFT"}, "text": "15", "orig": "15", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 166, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 502.869, "r_y0": 417.128, "r_x1": 509.189, "r_y1": 417.128, "r_x2": 509.189, "r_y2": 411.55, "r_x3": 502.869, "r_y3": 411.55, "coord_origin": "TOPLEFT"}, "text": "29", "orig": "29", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 167, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 384.354, "r_y0": 386.393, "r_x1": 430.993, "r_y1": 386.393, "r_x2": 430.993, "r_y2": 381.96, "r_x3": 384.354, "r_y3": 381.96, "coord_origin": "TOPLEFT"}, "text": "Predicted Structure", "orig": "Predicted Structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": [{"id": 158, "label": "text", "bbox": {"l": 437.379, "t": 401.109, "r": 443.699, "b": 406.686, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 113, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 437.379, "r_y0": 406.686, "r_x1": 443.699, "r_y1": 406.686, "r_x2": 443.699, "r_y2": 401.109, "r_x3": 437.379, "r_y3": 401.109, "coord_origin": "TOPLEFT"}, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 159, "label": "text", "bbox": {"l": 450.332, "t": 401.109, "r": 456.651, "b": 406.686, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 114, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 450.332, "r_y0": 406.686, "r_x1": 456.651, "r_y1": 406.686, "r_x2": 456.651, "r_y2": 401.109, "r_x3": 450.332, "r_y3": 401.109, "coord_origin": "TOPLEFT"}, "text": "17", "orig": "17", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 160, "label": "text", "bbox": {"l": 463.285, "t": 401.109, "r": 469.604, "b": 406.686, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 115, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 463.285, "r_y0": 406.686, "r_x1": 469.604, "r_y1": 406.686, "r_x2": 469.604, "r_y2": 401.109, "r_x3": 463.285, "r_y3": 401.109, "coord_origin": "TOPLEFT"}, "text": "18", "orig": "18", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 161, "label": "text", "bbox": {"l": 476.237, "t": 401.109, "r": 482.557, "b": 406.686, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 116, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 476.237, "r_y0": 406.686, "r_x1": 482.557, "r_y1": 406.686, "r_x2": 482.557, "r_y2": 401.109, "r_x3": 476.237, "r_y3": 401.109, "coord_origin": "TOPLEFT"}, "text": "19", "orig": "19", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 162, "label": "text", "bbox": {"l": 489.19, "t": 401.109, "r": 495.509, "b": 406.686, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 117, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 489.19, "r_y0": 406.686, "r_x1": 495.509, "r_y1": 406.686, "r_x2": 495.509, "r_y2": 401.109, "r_x3": 489.19, "r_y3": 401.109, "coord_origin": "TOPLEFT"}, "text": "20", "orig": "20", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 163, "label": "text", "bbox": {"l": 502.143, "t": 401.109, "r": 508.462, "b": 406.686, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 118, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 502.143, "r_y0": 406.686, "r_x1": 508.462, "r_y1": 406.686, "r_x2": 508.462, "r_y2": 401.109, "r_x3": 502.143, "r_y3": 401.109, "coord_origin": "TOPLEFT"}, "text": "21", "orig": "21", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 164, "label": "text", "bbox": {"l": 515.095, "t": 401.109, "r": 521.414, "b": 406.686, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 119, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 515.095, "r_y0": 406.686, "r_x1": 521.414, "r_y1": 406.686, "r_x2": 521.414, "r_y2": 401.109, "r_x3": 515.095, "r_y3": 401.109, "coord_origin": "TOPLEFT"}, "text": "22", "orig": "22", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 165, "label": "text", "bbox": {"l": 385.281, "t": 411.594, "r": 391.601, "b": 417.172, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 120, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 385.281, "r_y0": 417.172, "r_x1": 391.601, "r_y1": 417.172, "r_x2": 391.601, "r_y2": 411.594, "r_x3": 385.281, "r_y3": 411.594, "coord_origin": "TOPLEFT"}, "text": "23", "orig": "23", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 166, "label": "text", "bbox": {"l": 398.523, "t": 411.594, "r": 404.843, "b": 417.172, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 121, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 398.523, "r_y0": 417.172, "r_x1": 404.843, "r_y1": 417.172, "r_x2": 404.843, "r_y2": 411.594, "r_x3": 398.523, "r_y3": 411.594, "coord_origin": "TOPLEFT"}, "text": "24", "orig": "24", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 167, "label": "text", "bbox": {"l": 411.476, "t": 411.594, "r": 417.795, "b": 417.172, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 122, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 411.476, "r_y0": 417.172, "r_x1": 417.795, "r_y1": 417.172, "r_x2": 417.795, "r_y2": 411.594, "r_x3": 411.476, "r_y3": 411.594, "coord_origin": "TOPLEFT"}, "text": "25", "orig": "25", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 168, "label": "text", "bbox": {"l": 437.379, "t": 411.594, "r": 443.699, "b": 417.172, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 123, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 437.379, "r_y0": 417.172, "r_x1": 443.699, "r_y1": 417.172, "r_x2": 443.699, "r_y2": 411.594, "r_x3": 437.379, "r_y3": 411.594, "coord_origin": "TOPLEFT"}, "text": "26", "orig": "26", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 169, "label": "text", "bbox": {"l": 450.332, "t": 411.594, "r": 456.651, "b": 417.172, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 124, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 450.332, "r_y0": 417.172, "r_x1": 456.651, "r_y1": 417.172, "r_x2": 456.651, "r_y2": 411.594, "r_x3": 450.332, "r_y3": 411.594, "coord_origin": "TOPLEFT"}, "text": "27", "orig": "27", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 170, "label": "text", "bbox": {"l": 463.285, "t": 411.594, "r": 469.604, "b": 417.172, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 125, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 463.285, "r_y0": 417.172, "r_x1": 469.604, "r_y1": 417.172, "r_x2": 469.604, "r_y2": 411.594, "r_x3": 463.285, "r_y3": 411.594, "coord_origin": "TOPLEFT"}, "text": "28", "orig": "28", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 171, "label": "text", "bbox": {"l": 385.281, "t": 421.626, "r": 391.601, "b": 427.203, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 126, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 385.281, "r_y0": 427.203, "r_x1": 391.601, "r_y1": 427.203, "r_x2": 391.601, "r_y2": 421.626, "r_x3": 385.281, "r_y3": 421.626, "coord_origin": "TOPLEFT"}, "text": "30", "orig": "30", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 172, "label": "text", "bbox": {"l": 398.523, "t": 421.626, "r": 404.843, "b": 427.203, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 127, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 398.523, "r_y0": 427.203, "r_x1": 404.843, "r_y1": 427.203, "r_x2": 404.843, "r_y2": 421.626, "r_x3": 398.523, "r_y3": 421.626, "coord_origin": "TOPLEFT"}, "text": "31", "orig": "31", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 173, "label": "text", "bbox": {"l": 411.476, "t": 421.626, "r": 417.795, "b": 427.203, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 128, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 411.476, "r_y0": 427.203, "r_x1": 417.795, "r_y1": 427.203, "r_x2": 417.795, "r_y2": 421.626, "r_x3": 411.476, "r_y3": 421.626, "coord_origin": "TOPLEFT"}, "text": "32", "orig": "32", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 174, "label": "text", "bbox": {"l": 424.429, "t": 421.626, "r": 430.748, "b": 427.203, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 129, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 424.429, "r_y0": 427.203, "r_x1": 430.748, "r_y1": 427.203, "r_x2": 430.748, "r_y2": 421.626, "r_x3": 424.429, "r_y3": 421.626, "coord_origin": "TOPLEFT"}, "text": "33", "orig": "33", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 175, "label": "text", "bbox": {"l": 437.381, "t": 421.626, "r": 443.701, "b": 427.203, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 130, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 437.381, "r_y0": 427.203, "r_x1": 443.701, "r_y1": 427.203, "r_x2": 443.701, "r_y2": 421.626, "r_x3": 437.381, "r_y3": 421.626, "coord_origin": "TOPLEFT"}, "text": "34", "orig": "34", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 176, "label": "text", "bbox": {"l": 450.334, "t": 421.626, "r": 456.653, "b": 427.203, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 131, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 450.334, "r_y0": 427.203, "r_x1": 456.653, "r_y1": 427.203, "r_x2": 456.653, "r_y2": 421.626, "r_x3": 450.334, "r_y3": 421.626, "coord_origin": "TOPLEFT"}, "text": "35", "orig": "35", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 177, "label": "text", "bbox": {"l": 463.287, "t": 421.626, "r": 469.606, "b": 427.203, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 132, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 463.287, "r_y0": 427.203, "r_x1": 469.606, "r_y1": 427.203, "r_x2": 469.606, "r_y2": 421.626, "r_x3": 463.287, "r_y3": 421.626, "coord_origin": "TOPLEFT"}, "text": "36", "orig": "36", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 178, "label": "text", "bbox": {"l": 476.239, "t": 421.626, "r": 482.558, "b": 427.203, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 133, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 476.239, "r_y0": 427.203, "r_x1": 482.558, "r_y1": 427.203, "r_x2": 482.558, "r_y2": 421.626, "r_x3": 476.239, "r_y3": 421.626, "coord_origin": "TOPLEFT"}, "text": "37", "orig": "37", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 179, "label": "text", "bbox": {"l": 489.192, "t": 421.626, "r": 495.511, "b": 427.203, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 134, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 489.192, "r_y0": 427.203, "r_x1": 495.511, "r_y1": 427.203, "r_x2": 495.511, "r_y2": 421.626, "r_x3": 489.192, "r_y3": 421.626, "coord_origin": "TOPLEFT"}, "text": "38", "orig": "38", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 180, "label": "text", "bbox": {"l": 502.144, "t": 421.626, "r": 508.464, "b": 427.203, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 135, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 502.144, "r_y0": 427.203, "r_x1": 508.464, "r_y1": 427.203, "r_x2": 508.464, "r_y2": 421.626, "r_x3": 502.144, "r_y3": 421.626, "coord_origin": "TOPLEFT"}, "text": "39", "orig": "39", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 181, "label": "text", "bbox": {"l": 515.097, "t": 421.626, "r": 521.416, "b": 427.203, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 136, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 515.097, "r_y0": 427.203, "r_x1": 521.416, "r_y1": 427.203, "r_x2": 521.416, "r_y2": 421.626, "r_x3": 515.097, "r_y3": 421.626, "coord_origin": "TOPLEFT"}, "text": "40", "orig": "40", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 182, "label": "text", "bbox": {"l": 528.05, "t": 421.626, "r": 534.369, "b": 427.203, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 137, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 528.05, "r_y0": 427.203, "r_x1": 534.369, "r_y1": 427.203, "r_x2": 534.369, "r_y2": 421.626, "r_x3": 528.05, "r_y3": 421.626, "coord_origin": "TOPLEFT"}, "text": "41", "orig": "41", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 183, "label": "text", "bbox": {"l": 385.281, "t": 432.6, "r": 391.601, "b": 438.178, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 138, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 385.281, "r_y0": 438.178, "r_x1": 391.601, "r_y1": 438.178, "r_x2": 391.601, "r_y2": 432.6, "r_x3": 385.281, "r_y3": 432.6, "coord_origin": "TOPLEFT"}, "text": "42", "orig": "42", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 184, "label": "text", "bbox": {"l": 398.523, "t": 432.6, "r": 404.843, "b": 438.178, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 139, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 398.523, "r_y0": 438.178, "r_x1": 404.843, "r_y1": 438.178, "r_x2": 404.843, "r_y2": 432.6, "r_x3": 398.523, "r_y3": 432.6, "coord_origin": "TOPLEFT"}, "text": "43", "orig": "43", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 185, "label": "text", "bbox": {"l": 411.476, "t": 432.6, "r": 417.795, "b": 438.178, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 140, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 411.476, "r_y0": 438.178, "r_x1": 417.795, "r_y1": 438.178, "r_x2": 417.795, "r_y2": 432.6, "r_x3": 411.476, "r_y3": 432.6, "coord_origin": "TOPLEFT"}, "text": "44", "orig": "44", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 186, "label": "text", "bbox": {"l": 424.429, "t": 432.6, "r": 430.748, "b": 438.178, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 141, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 424.429, "r_y0": 438.178, "r_x1": 430.748, "r_y1": 438.178, "r_x2": 430.748, "r_y2": 432.6, "r_x3": 424.429, "r_y3": 432.6, "coord_origin": "TOPLEFT"}, "text": "45", "orig": "45", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 187, "label": "text", "bbox": {"l": 437.381, "t": 432.6, "r": 443.701, "b": 438.178, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 142, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 437.381, "r_y0": 438.178, "r_x1": 443.701, "r_y1": 438.178, "r_x2": 443.701, "r_y2": 432.6, "r_x3": 437.381, "r_y3": 432.6, "coord_origin": "TOPLEFT"}, "text": "46", "orig": "46", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 188, "label": "text", "bbox": {"l": 450.334, "t": 432.6, "r": 456.653, "b": 438.178, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 143, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 450.334, "r_y0": 438.178, "r_x1": 456.653, "r_y1": 438.178, "r_x2": 456.653, "r_y2": 432.6, "r_x3": 450.334, "r_y3": 432.6, "coord_origin": "TOPLEFT"}, "text": "47", "orig": "47", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 189, "label": "text", "bbox": {"l": 463.287, "t": 432.6, "r": 469.606, "b": 438.178, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 144, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 463.287, "r_y0": 438.178, "r_x1": 469.606, "r_y1": 438.178, "r_x2": 469.606, "r_y2": 432.6, "r_x3": 463.287, "r_y3": 432.6, "coord_origin": "TOPLEFT"}, "text": "48", "orig": "48", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 190, "label": "text", "bbox": {"l": 476.239, "t": 432.6, "r": 482.558, "b": 438.178, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 145, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 476.239, "r_y0": 438.178, "r_x1": 482.558, "r_y1": 438.178, "r_x2": 482.558, "r_y2": 432.6, "r_x3": 476.239, "r_y3": 432.6, "coord_origin": "TOPLEFT"}, "text": "49", "orig": "49", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 191, "label": "text", "bbox": {"l": 489.192, "t": 432.6, "r": 495.511, "b": 438.178, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 146, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 489.192, "r_y0": 438.178, "r_x1": 495.511, "r_y1": 438.178, "r_x2": 495.511, "r_y2": 432.6, "r_x3": 489.192, "r_y3": 432.6, "coord_origin": "TOPLEFT"}, "text": "50", "orig": "50", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 192, "label": "text", "bbox": {"l": 502.144, "t": 432.6, "r": 508.464, "b": 438.178, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 147, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 502.144, "r_y0": 438.178, "r_x1": 508.464, "r_y1": 438.178, "r_x2": 508.464, "r_y2": 432.6, "r_x3": 502.144, "r_y3": 432.6, "coord_origin": "TOPLEFT"}, "text": "51", "orig": "51", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 193, "label": "text", "bbox": {"l": 515.097, "t": 432.6, "r": 521.416, "b": 438.178, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 148, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 515.097, "r_y0": 438.178, "r_x1": 521.416, "r_y1": 438.178, "r_x2": 521.416, "r_y2": 432.6, "r_x3": 515.097, "r_y3": 432.6, "coord_origin": "TOPLEFT"}, "text": "52", "orig": "52", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 194, "label": "text", "bbox": {"l": 528.05, "t": 432.6, "r": 534.369, "b": 438.178, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 149, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 528.05, "r_y0": 438.178, "r_x1": 534.369, "r_y1": 438.178, "r_x2": 534.369, "r_y2": 432.6, "r_x3": 528.05, "r_y3": 432.6, "coord_origin": "TOPLEFT"}, "text": "53", "orig": "53", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 195, "label": "text", "bbox": {"l": 385.281, "t": 389.756, "r": 388.441, "b": 395.333, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 150, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 385.281, "r_y0": 395.333, "r_x1": 388.441, "r_y1": 395.333, "r_x2": 388.441, "r_y2": 389.756, "r_x3": 385.281, "r_y3": 389.756, "coord_origin": "TOPLEFT"}, "text": "0", "orig": "0", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 196, "label": "text", "bbox": {"l": 398.523, "t": 389.756, "r": 401.683, "b": 395.333, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 151, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 398.523, "r_y0": 395.333, "r_x1": 401.683, "r_y1": 395.333, "r_x2": 401.683, "r_y2": 389.756, "r_x3": 398.523, "r_y3": 389.756, "coord_origin": "TOPLEFT"}, "text": "1", "orig": "1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 197, "label": "text", "bbox": {"l": 411.475, "t": 389.756, "r": 414.635, "b": 395.333, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 152, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 411.475, "r_y0": 395.333, "r_x1": 414.635, "r_y1": 395.333, "r_x2": 414.635, "r_y2": 389.756, "r_x3": 411.475, "r_y3": 389.756, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 198, "label": "text", "bbox": {"l": 424.427, "t": 389.756, "r": 427.587, "b": 395.333, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 153, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 424.427, "r_y0": 395.333, "r_x1": 427.587, "r_y1": 395.333, "r_x2": 427.587, "r_y2": 389.756, "r_x3": 424.427, "r_y3": 389.756, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 199, "label": "text", "bbox": {"l": 437.379, "t": 389.756, "r": 440.539, "b": 395.333, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 154, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 437.379, "r_y0": 395.333, "r_x1": 440.539, "r_y1": 395.333, "r_x2": 440.539, "r_y2": 389.756, "r_x3": 437.379, "r_y3": 389.756, "coord_origin": "TOPLEFT"}, "text": "4", "orig": "4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 200, "label": "text", "bbox": {"l": 450.331, "t": 389.756, "r": 453.491, "b": 395.333, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 155, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 450.331, "r_y0": 395.333, "r_x1": 453.491, "r_y1": 395.333, "r_x2": 453.491, "r_y2": 389.756, "r_x3": 450.331, "r_y3": 389.756, "coord_origin": "TOPLEFT"}, "text": "5", "orig": "5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 201, "label": "text", "bbox": {"l": 463.283, "t": 389.756, "r": 466.443, "b": 395.333, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 156, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 463.283, "r_y0": 395.333, "r_x1": 466.443, "r_y1": 395.333, "r_x2": 466.443, "r_y2": 389.756, "r_x3": 463.283, "r_y3": 389.756, "coord_origin": "TOPLEFT"}, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 202, "label": "text", "bbox": {"l": 476.235, "t": 389.756, "r": 479.395, "b": 395.333, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 157, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 476.235, "r_y0": 395.333, "r_x1": 479.395, "r_y1": 395.333, "r_x2": 479.395, "r_y2": 389.756, "r_x3": 476.235, "r_y3": 389.756, "coord_origin": "TOPLEFT"}, "text": "7", "orig": "7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 203, "label": "text", "bbox": {"l": 489.187, "t": 389.756, "r": 492.347, "b": 395.333, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 158, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 489.187, "r_y0": 395.333, "r_x1": 492.347, "r_y1": 395.333, "r_x2": 492.347, "r_y2": 389.756, "r_x3": 489.187, "r_y3": 389.756, "coord_origin": "TOPLEFT"}, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 204, "label": "text", "bbox": {"l": 502.139, "t": 389.756, "r": 505.299, "b": 395.333, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 159, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 502.139, "r_y0": 395.333, "r_x1": 505.299, "r_y1": 395.333, "r_x2": 505.299, "r_y2": 389.756, "r_x3": 502.139, "r_y3": 389.756, "coord_origin": "TOPLEFT"}, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 205, "label": "text", "bbox": {"l": 515.091, "t": 389.756, "r": 521.411, "b": 395.333, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 160, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 515.091, "r_y0": 395.333, "r_x1": 521.411, "r_y1": 395.333, "r_x2": 521.411, "r_y2": 389.756, "r_x3": 515.091, "r_y3": 389.756, "coord_origin": "TOPLEFT"}, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 206, "label": "text", "bbox": {"l": 528.044, "t": 389.756, "r": 534.131, "b": 395.333, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 161, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 528.044, "r_y0": 395.333, "r_x1": 534.131, "r_y1": 395.333, "r_x2": 534.131, "r_y2": 389.756, "r_x3": 528.044, "r_y3": 389.756, "coord_origin": "TOPLEFT"}, "text": "11", "orig": "11", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 207, "label": "text", "bbox": {"l": 385.281, "t": 399.531, "r": 391.601, "b": 405.108, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 162, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 385.281, "r_y0": 405.108, "r_x1": 391.601, "r_y1": 405.108, "r_x2": 391.601, "r_y2": 399.531, "r_x3": 385.281, "r_y3": 399.531, "coord_origin": "TOPLEFT"}, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 208, "label": "text", "bbox": {"l": 398.523, "t": 399.531, "r": 404.843, "b": 405.108, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 163, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 398.523, "r_y0": 405.108, "r_x1": 404.843, "r_y1": 405.108, "r_x2": 404.843, "r_y2": 399.531, "r_x3": 398.523, "r_y3": 399.531, "coord_origin": "TOPLEFT"}, "text": "13", "orig": "13", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 209, "label": "text", "bbox": {"l": 411.476, "t": 399.531, "r": 417.795, "b": 405.108, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 164, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 411.476, "r_y0": 405.108, "r_x1": 417.795, "r_y1": 405.108, "r_x2": 417.795, "r_y2": 399.531, "r_x3": 411.476, "r_y3": 399.531, "coord_origin": "TOPLEFT"}, "text": "14", "orig": "14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 210, "label": "text", "bbox": {"l": 424.427, "t": 407.331, "r": 430.746, "b": 412.908, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 165, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 424.427, "r_y0": 412.908, "r_x1": 430.746, "r_y1": 412.908, "r_x2": 430.746, "r_y2": 407.331, "r_x3": 424.427, "r_y3": 407.331, "coord_origin": "TOPLEFT"}, "text": "15", "orig": "15", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 211, "label": "text", "bbox": {"l": 502.869, "t": 411.55, "r": 509.189, "b": 417.128, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 166, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 502.869, "r_y0": 417.128, "r_x1": 509.189, "r_y1": 417.128, "r_x2": 509.189, "r_y2": 411.55, "r_x3": 502.869, "r_y3": 411.55, "coord_origin": "TOPLEFT"}, "text": "29", "orig": "29", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 212, "label": "text", "bbox": {"l": 384.354, "t": 381.96, "r": 430.993, "b": 386.393, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 167, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 384.354, "r_y0": 386.393, "r_x1": 430.993, "r_y1": 386.393, "r_x2": 430.993, "r_y2": 381.96, "r_x3": 384.354, "r_y3": 381.96, "coord_origin": "TOPLEFT"}, "text": "Predicted Structure", "orig": "Predicted Structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}]}, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null}, {"label": "caption", "id": 5, "page_no": 7, "cluster": {"id": 5, "label": "caption", "bbox": {"l": 62.595, "t": 458.997, "r": 532.63, "b": 467.549, "coord_origin": "TOPLEFT"}, "confidence": 0.9153602719306946, "cells": [{"index": 168, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.595, "r_y0": 467.549, "r_x1": 98.849, "r_y1": 467.549, "r_x2": 98.849, "r_y2": 458.997, "r_x3": 62.595, "r_y3": 458.997, "coord_origin": "TOPLEFT"}, "text": "Figure 6:", "orig": "Figure 6:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 169, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 104.428, "r_y0": 467.549, "r_x1": 532.63, "r_y1": 467.549, "r_x2": 532.63, "r_y2": 458.997, "r_x3": 104.428, "r_y3": 458.997, "coord_origin": "TOPLEFT"}, "text": "An example of TableFormer predictions (bounding boxes and structure) from generated SynthTabNet table.", "orig": "An example of TableFormer predictions (bounding boxes and structure) from generated SynthTabNet table.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Figure 6: An example of TableFormer predictions (bounding boxes and structure) from generated SynthTabNet table."}, {"label": "section_header", "id": 2, "page_no": 7, "cluster": {"id": 2, "label": "section_header", "bbox": {"l": 50.112, "t": 491.395, "r": 163.756, "b": 501.247, "coord_origin": "TOPLEFT"}, "confidence": 0.9561247229576111, "cells": [{"index": 170, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 501.247, "r_x1": 163.756, "r_y1": 501.247, "r_x2": 163.756, "r_y2": 491.395, "r_x3": 50.112, "r_y3": 491.395, "coord_origin": "TOPLEFT"}, "text": "5.5. Qualitative Analysis", "orig": "5.5. Qualitative Analysis", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "5.5. Qualitative Analysis"}, {"label": "text", "id": 1, "page_no": 7, "cluster": {"id": 1, "label": "text", "bbox": {"l": 50.112, "t": 537.142, "r": 286.365, "b": 713.066, "coord_origin": "TOPLEFT"}, "confidence": 0.9852361679077148, "cells": [{"index": 171, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 545.694, "r_x1": 118.505, "r_y1": 545.694, "r_x2": 118.505, "r_y2": 537.142, "r_x3": 62.067, "r_y3": 537.142, "coord_origin": "TOPLEFT"}, "text": "We showcase", "orig": "We showcase", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 172, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 123.985, "r_y0": 545.694, "r_x1": 151.8, "r_y1": 545.694, "r_x2": 151.8, "r_y2": 537.142, "r_x3": 123.985, "r_y3": 537.142, "coord_origin": "TOPLEFT"}, "text": "several", "orig": "several", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 173, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 157.28, "r_y0": 545.694, "r_x1": 212.074, "r_y1": 545.694, "r_x2": 212.074, "r_y2": 537.142, "r_x3": 157.28, "r_y3": 537.142, "coord_origin": "TOPLEFT"}, "text": "visualizations", "orig": "visualizations", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 174, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 217.553, "r_y0": 545.694, "r_x1": 229.17, "r_y1": 545.694, "r_x2": 229.17, "r_y2": 537.142, "r_x3": 217.553, "r_y3": 537.142, "coord_origin": "TOPLEFT"}, "text": "for", "orig": "for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 175, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 234.659, "r_y0": 545.694, "r_x1": 246.833, "r_y1": 545.694, "r_x2": 246.833, "r_y2": 537.142, "r_x3": 234.659, "r_y3": 537.142, "coord_origin": "TOPLEFT"}, "text": "the", "orig": "the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 176, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 252.313, "r_y0": 545.694, "r_x1": 286.365, "r_y1": 545.694, "r_x2": 286.365, "r_y2": 537.142, "r_x3": 252.313, "r_y3": 537.142, "coord_origin": "TOPLEFT"}, "text": "different", "orig": "different", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 177, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 557.649, "r_x1": 211.157, "r_y1": 557.649, "r_x2": 211.157, "r_y2": 549.097, "r_x3": 50.112, "r_y3": 549.097, "coord_origin": "TOPLEFT"}, "text": "components of our network on various", "orig": "components of our network on various", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 178, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 215.1, "r_y0": 557.506, "r_x1": 259.175, "r_y1": 557.506, "r_x2": 259.175, "r_y2": 548.918, "r_x3": 215.1, "r_y3": 548.918, "coord_origin": "TOPLEFT"}, "text": "'complex'", "orig": "'complex'", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 179, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 263.12, "r_y0": 557.649, "r_x1": 286.363, "r_y1": 557.649, "r_x2": 286.363, "r_y2": 549.097, "r_x3": 263.12, "r_y3": 549.097, "coord_origin": "TOPLEFT"}, "text": "tables", "orig": "tables", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 180, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 569.604, "r_x1": 231.72, "r_y1": 569.604, "r_x2": 231.72, "r_y2": 561.052, "r_x3": 50.112, "r_y3": 561.052, "coord_origin": "TOPLEFT"}, "text": "within datasets presented in this work in Fig.", "orig": "within datasets presented in this work in Fig.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 181, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 236.064, "r_y0": 569.604, "r_x1": 277.03, "r_y1": 569.604, "r_x2": 277.03, "r_y2": 561.052, "r_x3": 236.064, "r_y3": 561.052, "coord_origin": "TOPLEFT"}, "text": "5 and Fig.", "orig": "5 and Fig.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 182, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 281.384, "r_y0": 569.604, "r_x1": 286.365, "r_y1": 569.604, "r_x2": 286.365, "r_y2": 561.052, "r_x3": 281.384, "r_y3": 561.052, "coord_origin": "TOPLEFT"}, "text": "6", "orig": "6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 183, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 581.559, "r_x1": 286.365, "r_y1": 581.559, "r_x2": 286.365, "r_y2": 573.0070000000001, "r_x3": 50.112, "r_y3": 573.0070000000001, "coord_origin": "TOPLEFT"}, "text": "As it is shown, our model is able to predict bounding boxes", "orig": "As it is shown, our model is able to predict bounding boxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 184, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 593.514, "r_x1": 122.341, "r_y1": 593.514, "r_x2": 122.341, "r_y2": 584.962, "r_x3": 50.112, "r_y3": 584.962, "coord_origin": "TOPLEFT"}, "text": "for all table cells,", "orig": "for all table cells,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 185, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 126.107, "r_y0": 593.514, "r_x1": 228.004, "r_y1": 593.514, "r_x2": 228.004, "r_y2": 584.962, "r_x3": 126.107, "r_y3": 584.962, "coord_origin": "TOPLEFT"}, "text": "even for the empty ones.", "orig": "even for the empty ones.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 186, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 234.151, "r_y0": 593.514, "r_x1": 286.365, "r_y1": 593.514, "r_x2": 286.365, "r_y2": 584.962, "r_x3": 234.151, "r_y3": 584.962, "coord_origin": "TOPLEFT"}, "text": "Additionally,", "orig": "Additionally,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 187, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 605.47, "r_x1": 286.365, "r_y1": 605.47, "r_x2": 286.365, "r_y2": 596.918, "r_x3": 50.112, "r_y3": 596.918, "coord_origin": "TOPLEFT"}, "text": "our post-processing techniques can extract the cell content", "orig": "our post-processing techniques can extract the cell content", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 188, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 617.425, "r_x1": 286.365, "r_y1": 617.425, "r_x2": 286.365, "r_y2": 608.873, "r_x3": 50.112, "r_y3": 608.873, "coord_origin": "TOPLEFT"}, "text": "by matching the predicted bounding boxes to the PDF cells", "orig": "by matching the predicted bounding boxes to the PDF cells", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 189, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 629.38, "r_x1": 230.873, "r_y1": 629.38, "r_x2": 230.873, "r_y2": 620.828, "r_x3": 50.112, "r_y3": 620.828, "coord_origin": "TOPLEFT"}, "text": "based on their overlap and spatial proximity.", "orig": "based on their overlap and spatial proximity.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 190, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 235.855, "r_y0": 629.38, "r_x1": 286.365, "r_y1": 629.38, "r_x2": 286.365, "r_y2": 620.828, "r_x3": 235.855, "r_y3": 620.828, "coord_origin": "TOPLEFT"}, "text": "The left part", "orig": "The left part", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 191, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 641.335, "r_x1": 77.121, "r_y1": 641.335, "r_x2": 77.121, "r_y2": 632.783, "r_x3": 50.112, "r_y3": 632.783, "coord_origin": "TOPLEFT"}, "text": "of Fig.", "orig": "of Fig.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 192, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 81.544, "r_y0": 641.335, "r_x1": 286.365, "r_y1": 641.335, "r_x2": 286.365, "r_y2": 632.783, "r_x3": 81.544, "r_y3": 632.783, "coord_origin": "TOPLEFT"}, "text": "5 demonstrates also the adaptability of our method", "orig": "5 demonstrates also the adaptability of our method", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 193, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 653.29, "r_x1": 57.863, "r_y1": 653.29, "r_x2": 57.863, "r_y2": 644.738, "r_x3": 50.112, "r_y3": 644.738, "coord_origin": "TOPLEFT"}, "text": "to", "orig": "to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 194, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.436, "r_y0": 653.29, "r_x1": 119.691, "r_y1": 653.29, "r_x2": 119.691, "r_y2": 644.738, "r_x3": 62.436, "r_y3": 644.738, "coord_origin": "TOPLEFT"}, "text": "any language,", "orig": "any language,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 195, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 124.782, "r_y0": 653.29, "r_x1": 133.081, "r_y1": 653.29, "r_x2": 133.081, "r_y2": 644.738, "r_x3": 124.782, "r_y3": 644.738, "coord_origin": "TOPLEFT"}, "text": "as", "orig": "as", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 196, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 137.653, "r_y0": 653.29, "r_x1": 143.193, "r_y1": 653.29, "r_x2": 143.193, "r_y2": 644.738, "r_x3": 137.653, "r_y3": 644.738, "coord_origin": "TOPLEFT"}, "text": "it", "orig": "it", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 197, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 147.765, "r_y0": 653.29, "r_x1": 214.854, "r_y1": 653.29, "r_x2": 214.854, "r_y2": 644.738, "r_x3": 147.765, "r_y3": 644.738, "coord_origin": "TOPLEFT"}, "text": "can successfully", "orig": "can successfully", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 198, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 219.426, "r_y0": 653.29, "r_x1": 246.385, "r_y1": 653.29, "r_x2": 246.385, "r_y2": 644.738, "r_x3": 219.426, "r_y3": 644.738, "coord_origin": "TOPLEFT"}, "text": "extract", "orig": "extract", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 199, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 250.958, "r_y0": 653.29, "r_x1": 286.365, "r_y1": 653.29, "r_x2": 286.365, "r_y2": 644.738, "r_x3": 250.958, "r_y3": 644.738, "coord_origin": "TOPLEFT"}, "text": "Japanese", "orig": "Japanese", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 200, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 665.245, "r_x1": 286.365, "r_y1": 665.245, "r_x2": 286.365, "r_y2": 656.693, "r_x3": 50.112, "r_y3": 656.693, "coord_origin": "TOPLEFT"}, "text": "text, although the training set contains only English content.", "orig": "text, although the training set contains only English content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 201, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 677.201, "r_x1": 286.365, "r_y1": 677.201, "r_x2": 286.365, "r_y2": 668.649, "r_x3": 50.112, "r_y3": 668.649, "coord_origin": "TOPLEFT"}, "text": "We provide more visualizations including the intermediate", "orig": "We provide more visualizations including the intermediate", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 202, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 689.156, "r_x1": 195.217, "r_y1": 689.156, "r_x2": 195.217, "r_y2": 680.604, "r_x3": 50.112, "r_y3": 680.604, "coord_origin": "TOPLEFT"}, "text": "steps in the supplementary material.", "orig": "steps in the supplementary material.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 203, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 199.431, "r_y0": 689.156, "r_x1": 286.365, "r_y1": 689.156, "r_x2": 286.365, "r_y2": 680.604, "r_x3": 199.431, "r_y3": 680.604, "coord_origin": "TOPLEFT"}, "text": "Overall these illustra-", "orig": "Overall these illustra-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 204, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 701.111, "r_x1": 286.365, "r_y1": 701.111, "r_x2": 286.365, "r_y2": 692.559, "r_x3": 50.112, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "tions justify the versatility of our method across a diverse", "orig": "tions justify the versatility of our method across a diverse", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 205, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 713.066, "r_x1": 226.888, "r_y1": 713.066, "r_x2": 226.888, "r_y2": 704.514, "r_x3": 50.112, "r_y3": 704.514, "coord_origin": "TOPLEFT"}, "text": "range of table appearances and content type.", "orig": "range of table appearances and content type.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "We showcase several visualizations for the different components of our network on various 'complex' tables within datasets presented in this work in Fig. 5 and Fig. 6 As it is shown, our model is able to predict bounding boxes for all table cells, even for the empty ones. Additionally, our post-processing techniques can extract the cell content by matching the predicted bounding boxes to the PDF cells based on their overlap and spatial proximity. The left part of Fig. 5 demonstrates also the adaptability of our method to any language, as it can successfully extract Japanese text, although the training set contains only English content. We provide more visualizations including the intermediate steps in the supplementary material. Overall these illustrations justify the versatility of our method across a diverse range of table appearances and content type."}, {"label": "section_header", "id": 4, "page_no": 7, "cluster": {"id": 4, "label": "section_header", "bbox": {"l": 308.862, "t": 490.709, "r": 460.848, "b": 501.457, "coord_origin": "TOPLEFT"}, "confidence": 0.9436525702476501, "cells": [{"index": 206, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 501.457, "r_x1": 460.848, "r_y1": 501.457, "r_x2": 460.848, "r_y2": 490.709, "r_x3": 308.862, "r_y3": 490.709, "coord_origin": "TOPLEFT"}, "text": "6. Future Work &Conclusion", "orig": "6. Future Work &Conclusion", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "6. Future Work &Conclusion"}, {"label": "text", "id": 0, "page_no": 7, "cluster": {"id": 0, "label": "text", "bbox": {"l": 308.862, "t": 513.162, "r": 545.115, "b": 653.22, "coord_origin": "TOPLEFT"}, "confidence": 0.9875594973564148, "cells": [{"index": 207, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 521.7139999999999, "r_x1": 545.115, "r_y1": 521.7139999999999, "r_x2": 545.115, "r_y2": 513.162, "r_x3": 320.817, "r_y3": 513.162, "coord_origin": "TOPLEFT"}, "text": "In this paper, we presented TableFormer an end-to-end", "orig": "In this paper, we presented TableFormer an end-to-end", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 208, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 533.669, "r_x1": 545.115, "r_y1": 533.669, "r_x2": 545.115, "r_y2": 525.117, "r_x3": 308.862, "r_y3": 525.117, "coord_origin": "TOPLEFT"}, "text": "transformer based approach to predict table structures and", "orig": "transformer based approach to predict table structures and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 209, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 545.624, "r_x1": 545.115, "r_y1": 545.624, "r_x2": 545.115, "r_y2": 537.072, "r_x3": 308.862, "r_y3": 537.072, "coord_origin": "TOPLEFT"}, "text": "bounding boxes of cells from an image. This approach en-", "orig": "bounding boxes of cells from an image. This approach en-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 210, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 557.579, "r_x1": 545.115, "r_y1": 557.579, "r_x2": 545.115, "r_y2": 549.027, "r_x3": 308.862, "r_y3": 549.027, "coord_origin": "TOPLEFT"}, "text": "ables us to recreate the table structure, and extract the cell", "orig": "ables us to recreate the table structure, and extract the cell", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 211, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 569.534, "r_x1": 524.562, "r_y1": 569.534, "r_x2": 524.562, "r_y2": 560.982, "r_x3": 308.862, "r_y3": 560.982, "coord_origin": "TOPLEFT"}, "text": "content from PDF or OCR by using bounding boxes.", "orig": "content from PDF or OCR by using bounding boxes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 212, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 529.623, "r_y0": 569.534, "r_x1": 545.115, "r_y1": 569.534, "r_x2": 545.115, "r_y2": 560.982, "r_x3": 529.623, "r_y3": 560.982, "coord_origin": "TOPLEFT"}, "text": "Ad-", "orig": "Ad-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 213, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 581.489, "r_x1": 545.115, "r_y1": 581.489, "r_x2": 545.115, "r_y2": 572.937, "r_x3": 308.862, "r_y3": 572.937, "coord_origin": "TOPLEFT"}, "text": "ditionally, it provides the versatility required in real-world", "orig": "ditionally, it provides the versatility required in real-world", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 214, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 593.4449999999999, "r_x1": 545.115, "r_y1": 593.4449999999999, "r_x2": 545.115, "r_y2": 584.893, "r_x3": 308.862, "r_y3": 584.893, "coord_origin": "TOPLEFT"}, "text": "scenarios when dealing with various types of PDF docu-", "orig": "scenarios when dealing with various types of PDF docu-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 215, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 605.4, "r_x1": 335.153, "r_y1": 605.4, "r_x2": 335.153, "r_y2": 596.848, "r_x3": 308.862, "r_y3": 596.848, "coord_origin": "TOPLEFT"}, "text": "ments,", "orig": "ments,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 216, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 339.656, "r_y0": 605.4, "r_x1": 400.468, "r_y1": 605.4, "r_x2": 400.468, "r_y2": 596.848, "r_x3": 339.656, "r_y3": 596.848, "coord_origin": "TOPLEFT"}, "text": "and languages.", "orig": "and languages.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 217, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 408.378, "r_y0": 605.4, "r_x1": 460.672, "r_y1": 605.4, "r_x2": 460.672, "r_y2": 596.848, "r_x3": 408.378, "r_y3": 596.848, "coord_origin": "TOPLEFT"}, "text": "Furthermore,", "orig": "Furthermore,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 218, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 465.175, "r_y0": 605.4, "r_x1": 545.115, "r_y1": 605.4, "r_x2": 545.115, "r_y2": 596.848, "r_x3": 465.175, "r_y3": 596.848, "coord_origin": "TOPLEFT"}, "text": "our method outper-", "orig": "our method outper-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 219, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 617.355, "r_x1": 495.471, "r_y1": 617.355, "r_x2": 495.471, "r_y2": 608.803, "r_x3": 308.862, "r_y3": 608.803, "coord_origin": "TOPLEFT"}, "text": "forms all state-of-the-arts with a wide margin.", "orig": "forms all state-of-the-arts with a wide margin.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 220, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 500.234, "r_y0": 617.355, "r_x1": 545.115, "r_y1": 617.355, "r_x2": 545.115, "r_y2": 608.803, "r_x3": 500.234, "r_y3": 608.803, "coord_origin": "TOPLEFT"}, "text": "Finally, we", "orig": "Finally, we", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 221, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 629.31, "r_x1": 545.115, "r_y1": 629.31, "r_x2": 545.115, "r_y2": 620.758, "r_x3": 308.862, "r_y3": 620.758, "coord_origin": "TOPLEFT"}, "text": "introduce 'SynthTabNet' a challenging synthetically gen-", "orig": "introduce 'SynthTabNet' a challenging synthetically gen-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 222, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 641.265, "r_x1": 545.115, "r_y1": 641.265, "r_x2": 545.115, "r_y2": 632.713, "r_x3": 308.862, "r_y3": 632.713, "coord_origin": "TOPLEFT"}, "text": "erated dataset that reinforces missing characteristics from", "orig": "erated dataset that reinforces missing characteristics from", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 223, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 653.22, "r_x1": 365.858, "r_y1": 653.22, "r_x2": 365.858, "r_y2": 644.668, "r_x3": 308.862, "r_y3": 644.668, "coord_origin": "TOPLEFT"}, "text": "other datasets.", "orig": "other datasets.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "In this paper, we presented TableFormer an end-to-end transformer based approach to predict table structures and bounding boxes of cells from an image. This approach enables us to recreate the table structure, and extract the cell content from PDF or OCR by using bounding boxes. Additionally, it provides the versatility required in real-world scenarios when dealing with various types of PDF documents, and languages. Furthermore, our method outperforms all state-of-the-arts with a wide margin. Finally, we introduce 'SynthTabNet' a challenging synthetically generated dataset that reinforces missing characteristics from other datasets."}, {"label": "section_header", "id": 3, "page_no": 7, "cluster": {"id": 3, "label": "section_header", "bbox": {"l": 308.862, "t": 672.099, "r": 364.406, "b": 682.847, "coord_origin": "TOPLEFT"}, "confidence": 0.9442470073699951, "cells": [{"index": 224, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 682.847, "r_x1": 364.406, "r_y1": 682.847, "r_x2": 364.406, "r_y2": 672.099, "r_x3": 308.862, "r_y3": 672.099, "coord_origin": "TOPLEFT"}, "text": "References", "orig": "References", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "References"}, {"label": "list_item", "id": 10, "page_no": 7, "cluster": {"id": 10, "label": "list_item", "bbox": {"l": 313.345, "t": 694.204, "r": 545.113, "b": 712.86, "coord_origin": "TOPLEFT"}, "confidence": 0.8318753838539124, "cells": [{"index": 225, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 313.345, "r_y0": 701.901, "r_x1": 323.8, "r_y1": 701.901, "r_x2": 323.8, "r_y2": 694.204, "r_x3": 313.345, "r_y3": 694.204, "coord_origin": "TOPLEFT"}, "text": "[1]", "orig": "[1]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 226, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.785, "r_y0": 701.901, "r_x1": 545.109, "r_y1": 701.901, "r_x2": 545.109, "r_y2": 694.204, "r_x3": 328.785, "r_y3": 694.204, "coord_origin": "TOPLEFT"}, "text": "Nicolas Carion, Francisco Massa, Gabriel Synnaeve, Nicolas", "orig": "Nicolas Carion, Francisco Massa, Gabriel Synnaeve, Nicolas", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 227, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 712.86, "r_x1": 545.113, "r_y1": 712.86, "r_x2": 545.113, "r_y2": 705.163, "r_x3": 328.781, "r_y3": 705.163, "coord_origin": "TOPLEFT"}, "text": "Usunier, Alexander Kirillov, and Sergey Zagoruyko. End-to-", "orig": "Usunier, Alexander Kirillov, and Sergey Zagoruyko. End-to-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[1] Nicolas Carion, Francisco Massa, Gabriel Synnaeve, Nicolas Usunier, Alexander Kirillov, and Sergey Zagoruyko. End-to-"}, {"label": "picture", "id": 15, "page_no": 7, "cluster": {"id": 15, "label": "picture", "bbox": {"l": 305.5836486816406, "t": 98.65415954589844, "r": 554.8258666992188, "b": 180.6267547607422, "coord_origin": "TOPLEFT"}, "confidence": 0.7699173092842102, "cells": [], "children": []}, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null}, {"label": "picture", "id": 14, "page_no": 7, "cluster": {"id": 14, "label": "picture", "bbox": {"l": 49.97503662109375, "t": 103.71266174316406, "r": 301.6335754394531, "b": 187.5789337158203, "coord_origin": "TOPLEFT"}, "confidence": 0.7873926162719727, "cells": [], "children": []}, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null}], "headers": [{"label": "page_footer", "id": 9, "page_no": 7, "cluster": {"id": 9, "label": "page_footer", "bbox": {"l": 295.121, "t": 734.402, "r": 300.102, "b": 742.954, "coord_origin": "TOPLEFT"}, "confidence": 0.8709858059883118, "cells": [{"index": 228, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 295.121, "r_y0": 742.954, "r_x1": 300.102, "r_y1": 742.954, "r_x2": 300.102, "r_y2": 734.402, "r_x3": 295.121, "r_y3": 734.402, "coord_origin": "TOPLEFT"}, "text": "8", "orig": "8", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "8"}]}}, {"page_no": 8, "size": {"width": 612.0, "height": 792.0}, "cells": [{"index": 0, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 83.82299999999998, "r_x1": 212.373, "r_y1": 83.82299999999998, "r_x2": 212.373, "r_y2": 76.12599999999998, "r_x3": 70.031, "r_y3": 76.12599999999998, "coord_origin": "TOPLEFT"}, "text": "end object detection with transformers.", "orig": "end object detection with transformers.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 217.313, "r_y0": 83.82299999999998, "r_x1": 286.363, "r_y1": 83.82299999999998, "r_x2": 286.363, "r_y2": 76.12599999999998, "r_x3": 217.313, "r_y3": 76.12599999999998, "coord_origin": "TOPLEFT"}, "text": "In Andrea Vedaldi,", "orig": "In Andrea Vedaldi,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 94.78200000000004, "r_x1": 286.363, "r_y1": 94.78200000000004, "r_x2": 286.363, "r_y2": 87.08500000000004, "r_x3": 70.031, "r_y3": 87.08500000000004, "coord_origin": "TOPLEFT"}, "text": "Horst Bischof, Thomas Brox, and Jan-Michael Frahm, edi-", "orig": "Horst Bischof, Thomas Brox, and Jan-Michael Frahm, edi-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 105.74000000000001, "r_x1": 85.722, "r_y1": 105.74000000000001, "r_x2": 85.722, "r_y2": 98.043, "r_x3": 70.031, "r_y3": 98.043, "coord_origin": "TOPLEFT"}, "text": "tors,", "orig": "tors,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 87.889, "r_y0": 105.61099999999999, "r_x1": 199.933, "r_y1": 105.61099999999999, "r_x2": 199.933, "r_y2": 97.88099999999997, "r_x3": 87.889, "r_y3": 97.88099999999997, "coord_origin": "TOPLEFT"}, "text": "Computer Vision - ECCV 2020", "orig": "Computer Vision - ECCV 2020", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 199.936, "r_y0": 105.74000000000001, "r_x1": 286.363, "r_y1": 105.74000000000001, "r_x2": 286.363, "r_y2": 98.043, "r_x3": 199.936, "r_y3": 98.043, "coord_origin": "TOPLEFT"}, "text": ", pages 213-229, Cham,", "orig": ", pages 213-229, Cham,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 116.69899999999996, "r_x1": 221.949, "r_y1": 116.69899999999996, "r_x2": 221.949, "r_y2": 109.00199999999995, "r_x3": 70.031, "r_y3": 109.00199999999995, "coord_origin": "TOPLEFT"}, "text": "2020. Springer International Publishing. 5", "orig": "2020. Springer International Publishing. 5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 54.595, "r_y0": 127.971, "r_x1": 65.05, "r_y1": 127.971, "r_x2": 65.05, "r_y2": 120.274, "r_x3": 54.595, "r_y3": 120.274, "coord_origin": "TOPLEFT"}, "text": "[2]", "orig": "[2]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 127.971, "r_x1": 286.359, "r_y1": 127.971, "r_x2": 286.359, "r_y2": 120.274, "r_x3": 70.035, "r_y3": 120.274, "coord_origin": "TOPLEFT"}, "text": "Zewen Chi, Heyan Huang, Heng-Da Xu, Houjin Yu, Wanx-", "orig": "Zewen Chi, Heyan Huang, Heng-Da Xu, Houjin Yu, Wanx-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 138.92999999999995, "r_x1": 179.672, "r_y1": 138.92999999999995, "r_x2": 179.672, "r_y2": 131.23299999999995, "r_x3": 70.031, "r_y3": 131.23299999999995, "coord_origin": "TOPLEFT"}, "text": "uan Yin, and Xian-Ling Mao.", "orig": "uan Yin, and Xian-Ling Mao.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 185.581, "r_y0": 138.92999999999995, "r_x1": 286.363, "r_y1": 138.92999999999995, "r_x2": 286.363, "r_y2": 131.23299999999995, "r_x3": 185.581, "r_y3": 131.23299999999995, "coord_origin": "TOPLEFT"}, "text": "Complicated table structure", "orig": "Complicated table structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 149.889, "r_x1": 113.115, "r_y1": 149.889, "r_x2": 113.115, "r_y2": 142.192, "r_x3": 70.031, "r_y3": 142.192, "coord_origin": "TOPLEFT"}, "text": "recognition.", "orig": "recognition.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 116.342, "r_y0": 149.76, "r_x1": 235.308, "r_y1": 149.76, "r_x2": 235.308, "r_y2": 142.02999999999997, "r_x3": 116.342, "r_y3": 142.02999999999997, "coord_origin": "TOPLEFT"}, "text": "arXiv preprint arXiv:1908.04729", "orig": "arXiv preprint arXiv:1908.04729", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 235.307, "r_y0": 149.889, "r_x1": 267.676, "r_y1": 149.889, "r_x2": 267.676, "r_y2": 142.192, "r_x3": 235.307, "r_y3": 142.192, "coord_origin": "TOPLEFT"}, "text": ", 2019. 3", "orig": ", 2019. 3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 54.595, "r_y0": 161.16099999999994, "r_x1": 65.05, "r_y1": 161.16099999999994, "r_x2": 65.05, "r_y2": 153.46400000000006, "r_x3": 54.595, "r_y3": 153.46400000000006, "coord_origin": "TOPLEFT"}, "text": "[3]", "orig": "[3]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 161.16099999999994, "r_x1": 218.779, "r_y1": 161.16099999999994, "r_x2": 218.779, "r_y2": 153.46400000000006, "r_x3": 70.035, "r_y3": 153.46400000000006, "coord_origin": "TOPLEFT"}, "text": "Bertrand Couasnon and Aurelie Lemaitre.", "orig": "Bertrand Couasnon and Aurelie Lemaitre.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 220.98, "r_y0": 161.03200000000004, "r_x1": 286.363, "r_y1": 161.03200000000004, "r_x2": 286.363, "r_y2": 153.30200000000002, "r_x3": 220.98, "r_y3": 153.30200000000002, "coord_origin": "TOPLEFT"}, "text": "Recognition of Ta-", "orig": "Recognition of Ta-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 171.99099999999999, "r_x1": 125.264, "r_y1": 171.99099999999999, "r_x2": 125.264, "r_y2": 164.26099999999997, "r_x3": 70.031, "r_y3": 164.26099999999997, "coord_origin": "TOPLEFT"}, "text": "bles and Forms", "orig": "bles and Forms", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 125.261, "r_y0": 172.12, "r_x1": 127.503, "r_y1": 172.12, "r_x2": 127.503, "r_y2": 164.423, "r_x3": 125.261, "r_y3": 164.423, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 19, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 129.986, "r_y0": 172.12, "r_x1": 286.36, "r_y1": 172.12, "r_x2": 286.36, "r_y2": 164.423, "r_x3": 129.986, "r_y3": 164.423, "coord_origin": "TOPLEFT"}, "text": "pages 647-677. Springer London, London,", "orig": "pages 647-677. Springer London, London,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 20, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 183.07799999999997, "r_x1": 97.917, "r_y1": 183.07799999999997, "r_x2": 97.917, "r_y2": 175.38099999999997, "r_x3": 70.031, "r_y3": 175.38099999999997, "coord_origin": "TOPLEFT"}, "text": "2014. 2", "orig": "2014. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 21, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 54.595, "r_y0": 194.35000000000002, "r_x1": 65.05, "r_y1": 194.35000000000002, "r_x2": 65.05, "r_y2": 186.65300000000002, "r_x3": 54.595, "r_y3": 186.65300000000002, "coord_origin": "TOPLEFT"}, "text": "[4]", "orig": "[4]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 22, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 194.35000000000002, "r_x1": 91.936, "r_y1": 194.35000000000002, "r_x2": 91.936, "r_y2": 186.65300000000002, "r_x3": 70.035, "r_y3": 186.65300000000002, "coord_origin": "TOPLEFT"}, "text": "Herv\u00b4 e", "orig": "Herv\u00b4 e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 23, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 97.101, "r_y0": 194.35000000000002, "r_x1": 124.736, "r_y1": 194.35000000000002, "r_x2": 124.736, "r_y2": 186.65300000000002, "r_x3": 97.101, "r_y3": 186.65300000000002, "coord_origin": "TOPLEFT"}, "text": "D\u00b4jean,", "orig": "D\u00b4jean,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 24, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 103.575, "r_y0": 194.35000000000002, "r_x1": 107.556, "r_y1": 194.35000000000002, "r_x2": 107.556, "r_y2": 186.65300000000002, "r_x3": 103.575, "r_y3": 186.65300000000002, "coord_origin": "TOPLEFT"}, "text": "e", "orig": "e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 25, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 130.636, "r_y0": 194.35000000000002, "r_x1": 163.497, "r_y1": 194.35000000000002, "r_x2": 163.497, "r_y2": 186.65300000000002, "r_x3": 130.636, "r_y3": 186.65300000000002, "coord_origin": "TOPLEFT"}, "text": "Jean-Luc", "orig": "Jean-Luc", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 26, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 168.662, "r_y0": 194.35000000000002, "r_x1": 200.923, "r_y1": 194.35000000000002, "r_x2": 200.923, "r_y2": 186.65300000000002, "r_x3": 168.662, "r_y3": 186.65300000000002, "coord_origin": "TOPLEFT"}, "text": "Meunier,", "orig": "Meunier,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 27, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 206.814, "r_y0": 194.35000000000002, "r_x1": 238.188, "r_y1": 194.35000000000002, "r_x2": 238.188, "r_y2": 186.65300000000002, "r_x3": 206.814, "r_y3": 186.65300000000002, "coord_origin": "TOPLEFT"}, "text": "Liangcai", "orig": "Liangcai", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 28, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 243.352, "r_y0": 194.35000000000002, "r_x1": 260.532, "r_y1": 194.35000000000002, "r_x2": 260.532, "r_y2": 186.65300000000002, "r_x3": 243.352, "r_y3": 186.65300000000002, "coord_origin": "TOPLEFT"}, "text": "Gao,", "orig": "Gao,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 29, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 266.432, "r_y0": 194.35000000000002, "r_x1": 286.364, "r_y1": 194.35000000000002, "r_x2": 286.364, "r_y2": 186.65300000000002, "r_x3": 266.432, "r_y3": 186.65300000000002, "coord_origin": "TOPLEFT"}, "text": "Yilun", "orig": "Yilun", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 30, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 205.30899999999997, "r_x1": 269.605, "r_y1": 205.30899999999997, "r_x2": 269.605, "r_y2": 197.61199999999997, "r_x3": 70.031, "r_y3": 197.61199999999997, "coord_origin": "TOPLEFT"}, "text": "Huang, Yu Fang, Florian Kleber, and Eva-Maria Lang.", "orig": "Huang, Yu Fang, Florian Kleber, and Eva-Maria Lang.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 274.411, "r_y0": 205.30899999999997, "r_x1": 286.363, "r_y1": 205.30899999999997, "r_x2": 286.363, "r_y2": 197.61199999999997, "r_x3": 274.411, "r_y3": 197.61199999999997, "coord_origin": "TOPLEFT"}, "text": "IC-", "orig": "IC-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 216.26800000000003, "r_x1": 286.363, "r_y1": 216.26800000000003, "r_x2": 286.363, "r_y2": 208.57100000000003, "r_x3": 70.031, "r_y3": 208.57100000000003, "coord_origin": "TOPLEFT"}, "text": "DAR 2019 Competition on Table Detection and Recognition", "orig": "DAR 2019 Competition on Table Detection and Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 227.22699999999998, "r_x1": 245.835, "r_y1": 227.22699999999998, "r_x2": 245.835, "r_y2": 219.52999999999997, "r_x3": 70.031, "r_y3": 219.52999999999997, "coord_origin": "TOPLEFT"}, "text": "(cTDaR), Apr. 2019. http://sac.founderit.com/. 2", "orig": "(cTDaR), Apr. 2019. http://sac.founderit.com/. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 54.595, "r_y0": 238.49900000000002, "r_x1": 65.05, "r_y1": 238.49900000000002, "r_x2": 65.05, "r_y2": 230.80200000000002, "r_x3": 54.595, "r_y3": 230.80200000000002, "coord_origin": "TOPLEFT"}, "text": "[5]", "orig": "[5]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 238.49900000000002, "r_x1": 286.359, "r_y1": 238.49900000000002, "r_x2": 286.359, "r_y2": 230.80200000000002, "r_x3": 70.035, "r_y3": 230.80200000000002, "coord_origin": "TOPLEFT"}, "text": "Basilios Gatos, Dimitrios Danatsas, Ioannis Pratikakis, and", "orig": "Basilios Gatos, Dimitrios Danatsas, Ioannis Pratikakis, and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 249.45799999999997, "r_x1": 286.363, "r_y1": 249.45799999999997, "r_x2": 286.363, "r_y2": 241.76099999999997, "r_x3": 70.031, "r_y3": 241.76099999999997, "coord_origin": "TOPLEFT"}, "text": "Stavros J Perantonis. Automatic table detection in document", "orig": "Stavros J Perantonis. Automatic table detection in document", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 260.41600000000005, "r_x1": 108.398, "r_y1": 260.41600000000005, "r_x2": 108.398, "r_y2": 252.71900000000005, "r_x3": 70.031, "r_y3": 252.71900000000005, "coord_origin": "TOPLEFT"}, "text": "images. In", "orig": "images. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 110.645, "r_y0": 260.28700000000003, "r_x1": 286.36, "r_y1": 260.28700000000003, "r_x2": 286.36, "r_y2": 252.55700000000002, "r_x3": 110.645, "r_y3": 252.55700000000002, "coord_origin": "TOPLEFT"}, "text": "International Conference on Pattern Recognition", "orig": "International Conference on Pattern Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 271.246, "r_x1": 140.579, "r_y1": 271.246, "r_x2": 140.579, "r_y2": 263.51599999999996, "r_x3": 70.031, "r_y3": 263.51599999999996, "coord_origin": "TOPLEFT"}, "text": "and Image Analysis", "orig": "and Image Analysis", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 140.578, "r_y0": 271.375, "r_x1": 266.475, "r_y1": 271.375, "r_x2": 266.475, "r_y2": 263.678, "r_x3": 140.578, "r_y3": 263.678, "coord_origin": "TOPLEFT"}, "text": ", pages 609-618. Springer, 2005. 2", "orig": ", pages 609-618. Springer, 2005. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 54.595, "r_y0": 282.647, "r_x1": 65.05, "r_y1": 282.647, "r_x2": 65.05, "r_y2": 274.95000000000005, "r_x3": 54.595, "r_y3": 274.95000000000005, "coord_origin": "TOPLEFT"}, "text": "[6]", "orig": "[6]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 282.647, "r_x1": 286.367, "r_y1": 282.647, "r_x2": 286.367, "r_y2": 274.95000000000005, "r_x3": 70.035, "r_y3": 274.95000000000005, "coord_origin": "TOPLEFT"}, "text": "MaxG\u00a8bel, Tamir Hassan, Ermelinda Oro, and Giorgio Orsi.", "orig": "MaxG\u00a8bel, Tamir Hassan, Ermelinda Oro, and Giorgio Orsi.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 94.719, "r_y0": 282.647, "r_x1": 99.202, "r_y1": 282.647, "r_x2": 99.202, "r_y2": 274.95000000000005, "r_x3": 94.719, "r_y3": 274.95000000000005, "coord_origin": "TOPLEFT"}, "text": "o", "orig": "o", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 293.606, "r_x1": 179.574, "r_y1": 293.606, "r_x2": 179.574, "r_y2": 285.909, "r_x3": 70.031, "r_y3": 285.909, "coord_origin": "TOPLEFT"}, "text": "Icdar 2013 table competition.", "orig": "Icdar 2013 table competition.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 187.016, "r_y0": 293.606, "r_x1": 194.485, "r_y1": 293.606, "r_x2": 194.485, "r_y2": 285.909, "r_x3": 187.016, "r_y3": 285.909, "coord_origin": "TOPLEFT"}, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 198.044, "r_y0": 293.477, "r_x1": 286.363, "r_y1": 293.477, "r_x2": 286.363, "r_y2": 285.747, "r_x3": 198.044, "r_y3": 285.747, "coord_origin": "TOPLEFT"}, "text": "2013 12th International", "orig": "2013 12th International", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 304.436, "r_x1": 260.199, "r_y1": 304.436, "r_x2": 260.199, "r_y2": 296.706, "r_x3": 70.031, "r_y3": 296.706, "coord_origin": "TOPLEFT"}, "text": "Conference on Document Analysis and Recognition", "orig": "Conference on Document Analysis and Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 48, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 260.198, "r_y0": 304.565, "r_x1": 262.44, "r_y1": 304.565, "r_x2": 262.44, "r_y2": 296.868, "r_x3": 260.198, "r_y3": 296.868, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 49, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 265.945, "r_y0": 304.565, "r_x1": 286.362, "r_y1": 304.565, "r_x2": 286.362, "r_y2": 296.868, "r_x3": 265.945, "r_y3": 296.868, "coord_origin": "TOPLEFT"}, "text": "pages", "orig": "pages", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 50, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 315.524, "r_x1": 142.749, "r_y1": 315.524, "r_x2": 142.749, "r_y2": 307.827, "r_x3": 70.031, "r_y3": 307.827, "coord_origin": "TOPLEFT"}, "text": "1449-1453, 2013. 2", "orig": "1449-1453, 2013. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 51, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 54.595, "r_y0": 326.796, "r_x1": 65.05, "r_y1": 326.796, "r_x2": 65.05, "r_y2": 319.099, "r_x3": 54.595, "r_y3": 319.099, "coord_origin": "TOPLEFT"}, "text": "[7]", "orig": "[7]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 52, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 326.796, "r_x1": 199.492, "r_y1": 326.796, "r_x2": 199.492, "r_y2": 319.099, "r_x3": 70.035, "r_y3": 319.099, "coord_origin": "TOPLEFT"}, "text": "EA Green and M Krishnamoorthy.", "orig": "EA Green and M Krishnamoorthy.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 53, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 206.988, "r_y0": 326.796, "r_x1": 286.359, "r_y1": 326.796, "r_x2": 286.359, "r_y2": 319.099, "r_x3": 206.988, "r_y3": 319.099, "coord_origin": "TOPLEFT"}, "text": "Recognition of tables", "orig": "Recognition of tables", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 54, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 337.754, "r_x1": 176.283, "r_y1": 337.754, "r_x2": 176.283, "r_y2": 330.057, "r_x3": 70.031, "r_y3": 330.057, "coord_origin": "TOPLEFT"}, "text": "using table grammars. procs.", "orig": "using table grammars. procs.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 55, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 182.604, "r_y0": 337.754, "r_x1": 190.073, "r_y1": 337.754, "r_x2": 190.073, "r_y2": 330.057, "r_x3": 182.604, "r_y3": 330.057, "coord_origin": "TOPLEFT"}, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 56, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 193.283, "r_y0": 337.625, "r_x1": 286.363, "r_y1": 337.625, "r_x2": 286.363, "r_y2": 329.895, "r_x3": 193.283, "r_y3": 329.895, "coord_origin": "TOPLEFT"}, "text": "Symposium on Document", "orig": "Symposium on Document", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 57, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 348.584, "r_x1": 206.347, "r_y1": 348.584, "r_x2": 206.347, "r_y2": 340.854, "r_x3": 70.031, "r_y3": 340.854, "coord_origin": "TOPLEFT"}, "text": "Analysis and Recognition (SDAIR'95)", "orig": "Analysis and Recognition (SDAIR'95)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 58, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 206.346, "r_y0": 348.713, "r_x1": 274.822, "r_y1": 348.713, "r_x2": 274.822, "r_y2": 341.016, "r_x3": 206.346, "r_y3": 341.016, "coord_origin": "TOPLEFT"}, "text": ", pages 261-277. 2", "orig": ", pages 261-277. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 59, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 54.595, "r_y0": 359.985, "r_x1": 65.05, "r_y1": 359.985, "r_x2": 65.05, "r_y2": 352.288, "r_x3": 54.595, "r_y3": 352.288, "coord_origin": "TOPLEFT"}, "text": "[8]", "orig": "[8]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 60, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 359.985, "r_x1": 286.359, "r_y1": 359.985, "r_x2": 286.359, "r_y2": 352.288, "r_x3": 70.035, "r_y3": 352.288, "coord_origin": "TOPLEFT"}, "text": "Khurram Azeem Hashmi, Alain Pagani, Marcus Liwicki, Di-", "orig": "Khurram Azeem Hashmi, Alain Pagani, Marcus Liwicki, Di-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 61, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 370.944, "r_x1": 234.125, "r_y1": 370.944, "r_x2": 234.125, "r_y2": 363.247, "r_x3": 70.031, "r_y3": 363.247, "coord_origin": "TOPLEFT"}, "text": "dier Stricker, and Muhammad Zeshan Afzal.", "orig": "dier Stricker, and Muhammad Zeshan Afzal.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 62, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 240.052, "r_y0": 370.944, "r_x1": 286.363, "r_y1": 370.944, "r_x2": 286.363, "r_y2": 363.247, "r_x3": 240.052, "r_y3": 363.247, "coord_origin": "TOPLEFT"}, "text": "Castabdetec-", "orig": "Castabdetec-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 63, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 381.903, "r_x1": 85.973, "r_y1": 381.903, "r_x2": 85.973, "r_y2": 374.206, "r_x3": 70.031, "r_y3": 374.206, "coord_origin": "TOPLEFT"}, "text": "tors:", "orig": "tors:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 64, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 90.349, "r_y0": 381.903, "r_x1": 286.363, "r_y1": 381.903, "r_x2": 286.363, "r_y2": 374.206, "r_x3": 90.349, "r_y3": 374.206, "coord_origin": "TOPLEFT"}, "text": "Cascade network for table detection in document im-", "orig": "Cascade network for table detection in document im-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 65, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 392.862, "r_x1": 286.363, "r_y1": 392.862, "r_x2": 286.363, "r_y2": 385.165, "r_x3": 70.031, "r_y3": 385.165, "coord_origin": "TOPLEFT"}, "text": "ages with recursive feature pyramid and switchable atrous", "orig": "ages with recursive feature pyramid and switchable atrous", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 66, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 403.821, "r_x1": 114.576, "r_y1": 403.821, "r_x2": 114.576, "r_y2": 396.124, "r_x3": 70.031, "r_y3": 396.124, "coord_origin": "TOPLEFT"}, "text": "convolution.", "orig": "convolution.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 67, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 117.804, "r_y0": 403.692, "r_x1": 186.729, "r_y1": 403.692, "r_x2": 186.729, "r_y2": 395.962, "r_x3": 117.804, "r_y3": 395.962, "coord_origin": "TOPLEFT"}, "text": "Journal of Imaging", "orig": "Journal of Imaging", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 68, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 186.728, "r_y0": 403.821, "r_x1": 243.001, "r_y1": 403.821, "r_x2": 243.001, "r_y2": 396.124, "r_x3": 186.728, "r_y3": 396.124, "coord_origin": "TOPLEFT"}, "text": ", 7(10), 2021. 1", "orig": ", 7(10), 2021. 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 69, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 54.595, "r_y0": 415.092, "r_x1": 65.05, "r_y1": 415.092, "r_x2": 65.05, "r_y2": 407.395, "r_x3": 54.595, "r_y3": 407.395, "coord_origin": "TOPLEFT"}, "text": "[9]", "orig": "[9]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 70, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 415.092, "r_x1": 286.359, "r_y1": 415.092, "r_x2": 286.359, "r_y2": 407.395, "r_x3": 70.035, "r_y3": 407.395, "coord_origin": "TOPLEFT"}, "text": "Kaiming He, Georgia Gkioxari, Piotr Dollar, and Ross Gir-", "orig": "Kaiming He, Georgia Gkioxari, Piotr Dollar, and Ross Gir-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 71, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 426.051, "r_x1": 147.133, "r_y1": 426.051, "r_x2": 147.133, "r_y2": 418.354, "r_x3": 70.031, "r_y3": 418.354, "coord_origin": "TOPLEFT"}, "text": "shick. Mask r-cnn. In", "orig": "shick. Mask r-cnn. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 72, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 149.156, "r_y0": 425.922, "r_x1": 286.36, "r_y1": 425.922, "r_x2": 286.36, "r_y2": 418.192, "r_x3": 149.156, "r_y3": 418.192, "coord_origin": "TOPLEFT"}, "text": "Proceedings of the IEEE International", "orig": "Proceedings of the IEEE International", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 73, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 436.881, "r_x1": 213.484, "r_y1": 436.881, "r_x2": 213.484, "r_y2": 429.151, "r_x3": 70.031, "r_y3": 429.151, "coord_origin": "TOPLEFT"}, "text": "Conference on Computer Vision (ICCV)", "orig": "Conference on Computer Vision (ICCV)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 74, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 213.483, "r_y0": 437.01, "r_x1": 261.041, "r_y1": 437.01, "r_x2": 261.041, "r_y2": 429.313, "r_x3": 213.483, "r_y3": 429.313, "coord_origin": "TOPLEFT"}, "text": ", Oct 2017. 1", "orig": ", Oct 2017. 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 75, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 448.282, "r_x1": 65.05, "r_y1": 448.282, "r_x2": 65.05, "r_y2": 440.585, "r_x3": 50.112, "r_y3": 440.585, "coord_origin": "TOPLEFT"}, "text": "[10]", "orig": "[10]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 76, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 448.282, "r_x1": 286.359, "r_y1": 448.282, "r_x2": 286.359, "r_y2": 440.585, "r_x3": 70.035, "r_y3": 440.585, "coord_origin": "TOPLEFT"}, "text": "Yelin He, X. Qi, Jiaquan Ye, Peng Gao, Yihao Chen, Bing-", "orig": "Yelin He, X. Qi, Jiaquan Ye, Peng Gao, Yihao Chen, Bing-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 77, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 459.241, "r_x1": 202.743, "r_y1": 459.241, "r_x2": 202.743, "r_y2": 451.544, "r_x3": 70.031, "r_y3": 451.544, "coord_origin": "TOPLEFT"}, "text": "cong Li, Xin Tang, and Rong Xiao.", "orig": "cong Li, Xin Tang, and Rong Xiao.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 78, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 209.001, "r_y0": 459.241, "r_x1": 286.363, "r_y1": 459.241, "r_x2": 286.363, "r_y2": 451.544, "r_x3": 209.001, "r_y3": 451.544, "coord_origin": "TOPLEFT"}, "text": "Pingan-vcgroup's so-", "orig": "Pingan-vcgroup's so-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 79, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 470.2, "r_x1": 286.363, "r_y1": 470.2, "r_x2": 286.363, "r_y2": 462.503, "r_x3": 70.031, "r_y3": 462.503, "coord_origin": "TOPLEFT"}, "text": "lution for icdar 2021 competition on scientific table image", "orig": "lution for icdar 2021 competition on scientific table image", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 80, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 481.159, "r_x1": 141.87, "r_y1": 481.159, "r_x2": 141.87, "r_y2": 473.462, "r_x3": 70.031, "r_y3": 473.462, "coord_origin": "TOPLEFT"}, "text": "recognition to latex.", "orig": "recognition to latex.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 81, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 145.097, "r_y0": 481.03, "r_x1": 166.016, "r_y1": 481.03, "r_x2": 166.016, "r_y2": 473.3, "r_x3": 145.097, "r_y3": 473.3, "coord_origin": "TOPLEFT"}, "text": "ArXiv", "orig": "ArXiv", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 82, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 166.015, "r_y0": 481.159, "r_x1": 259.902, "r_y1": 481.159, "r_x2": 259.902, "r_y2": 473.462, "r_x3": 166.015, "r_y3": 473.462, "coord_origin": "TOPLEFT"}, "text": ", abs/2105.01846, 2021. 2", "orig": ", abs/2105.01846, 2021. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 83, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 492.43, "r_x1": 65.05, "r_y1": 492.43, "r_x2": 65.05, "r_y2": 484.733, "r_x3": 50.112, "r_y3": 484.733, "coord_origin": "TOPLEFT"}, "text": "[11]", "orig": "[11]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 84, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 492.43, "r_x1": 117.091, "r_y1": 492.43, "r_x2": 117.091, "r_y2": 484.733, "r_x3": 70.035, "r_y3": 484.733, "coord_origin": "TOPLEFT"}, "text": "Jianying Hu,", "orig": "Jianying Hu,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 85, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 121.054, "r_y0": 492.43, "r_x1": 286.359, "r_y1": 492.43, "r_x2": 286.359, "r_y2": 484.733, "r_x3": 121.054, "r_y3": 484.733, "coord_origin": "TOPLEFT"}, "text": "Ramanujan S Kashi, Daniel P Lopresti, and", "orig": "Ramanujan S Kashi, Daniel P Lopresti, and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 86, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 503.389, "r_x1": 132.15, "r_y1": 503.389, "r_x2": 132.15, "r_y2": 495.692, "r_x3": 70.031, "r_y3": 495.692, "coord_origin": "TOPLEFT"}, "text": "Gordon Wilfong.", "orig": "Gordon Wilfong.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 87, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 137.691, "r_y0": 503.389, "r_x1": 273.362, "r_y1": 503.389, "r_x2": 273.362, "r_y2": 495.692, "r_x3": 137.691, "r_y3": 495.692, "coord_origin": "TOPLEFT"}, "text": "Medium-independent table detection.", "orig": "Medium-independent table detection.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 88, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 278.894, "r_y0": 503.389, "r_x1": 286.363, "r_y1": 503.389, "r_x2": 286.363, "r_y2": 495.692, "r_x3": 278.894, "r_y3": 495.692, "coord_origin": "TOPLEFT"}, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 89, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 514.219, "r_x1": 106.883, "r_y1": 514.219, "r_x2": 106.883, "r_y2": 506.489, "r_x3": 70.031, "r_y3": 506.489, "coord_origin": "TOPLEFT"}, "text": "Document", "orig": "Document", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 90, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 111.796, "r_y0": 514.219, "r_x1": 155.041, "r_y1": 514.219, "r_x2": 155.041, "r_y2": 506.489, "r_x3": 111.796, "r_y3": 506.489, "coord_origin": "TOPLEFT"}, "text": "Recognition", "orig": "Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 91, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 159.946, "r_y0": 514.219, "r_x1": 173.396, "r_y1": 514.219, "r_x2": 173.396, "r_y2": 506.489, "r_x3": 159.946, "r_y3": 506.489, "coord_origin": "TOPLEFT"}, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 92, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 178.309, "r_y0": 514.219, "r_x1": 211.046, "r_y1": 514.219, "r_x2": 211.046, "r_y2": 506.489, "r_x3": 178.309, "r_y3": 506.489, "coord_origin": "TOPLEFT"}, "text": "Retrieval", "orig": "Retrieval", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 93, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 215.959, "r_y0": 514.219, "r_x1": 227.409, "r_y1": 514.219, "r_x2": 227.409, "r_y2": 506.489, "r_x3": 215.959, "r_y3": 506.489, "coord_origin": "TOPLEFT"}, "text": "VII", "orig": "VII", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 94, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 227.405, "r_y0": 514.348, "r_x1": 229.647, "r_y1": 514.348, "r_x2": 229.647, "r_y2": 506.651, "r_x3": 227.405, "r_y3": 506.651, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 95, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 234.56, "r_y0": 514.348, "r_x1": 261.28, "r_y1": 514.348, "r_x2": 261.28, "r_y2": 506.651, "r_x3": 234.56, "r_y3": 506.651, "coord_origin": "TOPLEFT"}, "text": "volume", "orig": "volume", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 96, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 266.185, "r_y0": 514.348, "r_x1": 286.359, "r_y1": 514.348, "r_x2": 286.359, "r_y2": 506.651, "r_x3": 266.185, "r_y3": 506.651, "coord_origin": "TOPLEFT"}, "text": "3967,", "orig": "3967,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 97, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 525.307, "r_x1": 286.363, "r_y1": 525.307, "r_x2": 286.363, "r_y2": 517.61, "r_x3": 70.031, "r_y3": 517.61, "coord_origin": "TOPLEFT"}, "text": "pages 291-302. International Society for Optics and Photon-", "orig": "pages 291-302. International Society for Optics and Photon-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 98, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 536.266, "r_x1": 112.361, "r_y1": 536.266, "r_x2": 112.361, "r_y2": 528.569, "r_x3": 70.031, "r_y3": 528.569, "coord_origin": "TOPLEFT"}, "text": "ics, 1999. 2", "orig": "ics, 1999. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 99, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 547.538, "r_x1": 65.05, "r_y1": 547.538, "r_x2": 65.05, "r_y2": 539.841, "r_x3": 50.112, "r_y3": 539.841, "coord_origin": "TOPLEFT"}, "text": "[12]", "orig": "[12]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 100, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 547.538, "r_x1": 126.407, "r_y1": 547.538, "r_x2": 126.407, "r_y2": 539.841, "r_x3": 70.035, "r_y3": 539.841, "coord_origin": "TOPLEFT"}, "text": "Matthew Hurst.", "orig": "Matthew Hurst.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 101, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 130.648, "r_y0": 547.538, "r_x1": 286.359, "r_y1": 547.538, "r_x2": 286.359, "r_y2": 539.841, "r_x3": 130.648, "r_y3": 539.841, "coord_origin": "TOPLEFT"}, "text": "A constraint-based approach to table struc-", "orig": "A constraint-based approach to table struc-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 102, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 558.4970000000001, "r_x1": 124.654, "r_y1": 558.4970000000001, "r_x2": 124.654, "r_y2": 550.8, "r_x3": 70.031, "r_y3": 550.8, "coord_origin": "TOPLEFT"}, "text": "ture derivation.", "orig": "ture derivation.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 103, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 128.815, "r_y0": 558.4970000000001, "r_x1": 136.284, "r_y1": 558.4970000000001, "r_x2": 136.284, "r_y2": 550.8, "r_x3": 128.815, "r_y3": 550.8, "coord_origin": "TOPLEFT"}, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 104, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 138.811, "r_y0": 558.3679999999999, "r_x1": 286.362, "r_y1": 558.3679999999999, "r_x2": 286.362, "r_y2": 550.638, "r_x3": 138.811, "r_y3": 550.638, "coord_origin": "TOPLEFT"}, "text": "Proceedings of the Seventh International", "orig": "Proceedings of the Seventh International", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 105, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 569.327, "r_x1": 286.363, "r_y1": 569.327, "r_x2": 286.363, "r_y2": 561.597, "r_x3": 70.031, "r_y3": 561.597, "coord_origin": "TOPLEFT"}, "text": "Conference on Document Analysis and Recognition - Volume", "orig": "Conference on Document Analysis and Recognition - Volume", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 106, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 580.2860000000001, "r_x1": 74.514, "r_y1": 580.2860000000001, "r_x2": 74.514, "r_y2": 572.556, "r_x3": 70.031, "r_y3": 572.556, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 107, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 74.514, "r_y0": 580.415, "r_x1": 76.756, "r_y1": 580.415, "r_x2": 76.756, "r_y2": 572.718, "r_x3": 74.514, "r_y3": 572.718, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 108, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 79.06, "r_y0": 580.415, "r_x1": 286.363, "r_y1": 580.415, "r_x2": 286.363, "r_y2": 572.718, "r_x3": 79.06, "r_y3": 572.718, "coord_origin": "TOPLEFT"}, "text": "ICDAR '03, page 911, USA, 2003. IEEE Computer Soci-", "orig": "ICDAR '03, page 911, USA, 2003. IEEE Computer Soci-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 109, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 591.373, "r_x1": 82.647, "r_y1": 591.373, "r_x2": 82.647, "r_y2": 583.6759999999999, "r_x3": 70.031, "r_y3": 583.6759999999999, "coord_origin": "TOPLEFT"}, "text": "ety.", "orig": "ety.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 110, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 85.875, "r_y0": 591.373, "r_x1": 90.358, "r_y1": 591.373, "r_x2": 90.358, "r_y2": 583.6759999999999, "r_x3": 85.875, "r_y3": 583.6759999999999, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 111, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 602.645, "r_x1": 65.05, "r_y1": 602.645, "r_x2": 65.05, "r_y2": 594.948, "r_x3": 50.112, "r_y3": 594.948, "coord_origin": "TOPLEFT"}, "text": "[13]", "orig": "[13]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 112, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 602.645, "r_x1": 116.302, "r_y1": 602.645, "r_x2": 116.302, "r_y2": 594.948, "r_x3": 70.035, "r_y3": 594.948, "coord_origin": "TOPLEFT"}, "text": "Thotreingam", "orig": "Thotreingam", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 113, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 121.368, "r_y0": 602.645, "r_x1": 144.161, "r_y1": 602.645, "r_x2": 144.161, "r_y2": 594.948, "r_x3": 121.368, "r_y3": 594.948, "coord_origin": "TOPLEFT"}, "text": "Kasar,", "orig": "Kasar,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 114, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 149.926, "r_y0": 602.645, "r_x1": 186.796, "r_y1": 602.645, "r_x2": 186.796, "r_y2": 594.948, "r_x3": 149.926, "r_y3": 594.948, "coord_origin": "TOPLEFT"}, "text": "Philippine", "orig": "Philippine", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 115, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 191.862, "r_y0": 602.645, "r_x1": 217.013, "r_y1": 602.645, "r_x2": 217.013, "r_y2": 594.948, "r_x3": 191.862, "r_y3": 594.948, "coord_origin": "TOPLEFT"}, "text": "Barlas,", "orig": "Barlas,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 116, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 222.778, "r_y0": 602.645, "r_x1": 257.146, "r_y1": 602.645, "r_x2": 257.146, "r_y2": 594.948, "r_x3": 222.778, "r_y3": 594.948, "coord_origin": "TOPLEFT"}, "text": "Sebastien", "orig": "Sebastien", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 117, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 262.203, "r_y0": 602.645, "r_x1": 286.359, "r_y1": 602.645, "r_x2": 286.359, "r_y2": 594.948, "r_x3": 262.203, "r_y3": 594.948, "coord_origin": "TOPLEFT"}, "text": "Adam,", "orig": "Adam,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 118, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 613.604, "r_x1": 214.838, "r_y1": 613.604, "r_x2": 214.838, "r_y2": 605.907, "r_x3": 70.031, "r_y3": 605.907, "coord_origin": "TOPLEFT"}, "text": "Cl\u00b4ment Chatelain, and Thierry Paquet.", "orig": "Cl\u00b4ment Chatelain, and Thierry Paquet.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 119, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 78.504, "r_y0": 613.604, "r_x1": 82.485, "r_y1": 613.604, "r_x2": 82.485, "r_y2": 605.907, "r_x3": 78.504, "r_y3": 605.907, "coord_origin": "TOPLEFT"}, "text": "e", "orig": "e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 120, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 219.949, "r_y0": 613.604, "r_x1": 286.363, "r_y1": 613.604, "r_x2": 286.363, "r_y2": 605.907, "r_x3": 219.949, "r_y3": 605.907, "coord_origin": "TOPLEFT"}, "text": "Learning to detect", "orig": "Learning to detect", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 121, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 624.563, "r_x1": 286.363, "r_y1": 624.563, "r_x2": 286.363, "r_y2": 616.866, "r_x3": 70.031, "r_y3": 616.866, "coord_origin": "TOPLEFT"}, "text": "tables in scanned document images using line information.", "orig": "tables in scanned document images using line information.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 122, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 635.5219999999999, "r_x1": 77.5, "r_y1": 635.5219999999999, "r_x2": 77.5, "r_y2": 627.825, "r_x3": 70.031, "r_y3": 627.825, "coord_origin": "TOPLEFT"}, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 123, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 79.92, "r_y0": 635.393, "r_x1": 286.362, "r_y1": 635.393, "r_x2": 286.362, "r_y2": 627.663, "r_x3": 79.92, "r_y3": 627.663, "coord_origin": "TOPLEFT"}, "text": "2013 12th International Conference on Document Analy-", "orig": "2013 12th International Conference on Document Analy-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 124, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 646.352, "r_x1": 140.677, "r_y1": 646.352, "r_x2": 140.677, "r_y2": 638.6220000000001, "r_x3": 70.031, "r_y3": 638.6220000000001, "coord_origin": "TOPLEFT"}, "text": "sis and Recognition", "orig": "sis and Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 125, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 140.676, "r_y0": 646.481, "r_x1": 264.439, "r_y1": 646.481, "r_x2": 264.439, "r_y2": 638.784, "r_x3": 140.676, "r_y3": 638.784, "coord_origin": "TOPLEFT"}, "text": ", pages 1185-1189. IEEE, 2013. 2", "orig": ", pages 1185-1189. IEEE, 2013. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 126, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 657.7529999999999, "r_x1": 65.05, "r_y1": 657.7529999999999, "r_x2": 65.05, "r_y2": 650.056, "r_x3": 50.112, "r_y3": 650.056, "coord_origin": "TOPLEFT"}, "text": "[14]", "orig": "[14]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 127, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 657.7529999999999, "r_x1": 91.447, "r_y1": 657.7529999999999, "r_x2": 91.447, "r_y2": 650.056, "r_x3": 70.035, "r_y3": 650.056, "coord_origin": "TOPLEFT"}, "text": "Pratik", "orig": "Pratik", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 128, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 96.092, "r_y0": 657.7529999999999, "r_x1": 119.745, "r_y1": 657.7529999999999, "r_x2": 119.745, "r_y2": 650.056, "r_x3": 96.092, "r_y3": 650.056, "coord_origin": "TOPLEFT"}, "text": "Kayal,", "orig": "Kayal,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 129, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 124.99, "r_y0": 657.7529999999999, "r_x1": 149.397, "r_y1": 657.7529999999999, "r_x2": 149.397, "r_y2": 650.056, "r_x3": 124.99, "r_y3": 650.056, "coord_origin": "TOPLEFT"}, "text": "Mrinal", "orig": "Mrinal", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 130, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 154.042, "r_y0": 657.7529999999999, "r_x1": 180.188, "r_y1": 657.7529999999999, "r_x2": 180.188, "r_y2": 650.056, "r_x3": 154.042, "r_y3": 650.056, "coord_origin": "TOPLEFT"}, "text": "Anand,", "orig": "Anand,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 131, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 185.433, "r_y0": 657.7529999999999, "r_x1": 206.845, "r_y1": 657.7529999999999, "r_x2": 206.845, "r_y2": 650.056, "r_x3": 185.433, "r_y3": 650.056, "coord_origin": "TOPLEFT"}, "text": "Harsh", "orig": "Harsh", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 132, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 211.489, "r_y0": 657.7529999999999, "r_x1": 234.147, "r_y1": 657.7529999999999, "r_x2": 234.147, "r_y2": 650.056, "r_x3": 211.489, "r_y3": 650.056, "coord_origin": "TOPLEFT"}, "text": "Desai,", "orig": "Desai,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 133, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 239.393, "r_y0": 657.7529999999999, "r_x1": 252.34, "r_y1": 657.7529999999999, "r_x2": 252.34, "r_y2": 650.056, "r_x3": 239.393, "r_y3": 650.056, "coord_origin": "TOPLEFT"}, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 134, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 256.976, "r_y0": 657.7529999999999, "r_x1": 286.359, "r_y1": 657.7529999999999, "r_x2": 286.359, "r_y2": 650.056, "r_x3": 256.976, "r_y3": 650.056, "coord_origin": "TOPLEFT"}, "text": "Mayank", "orig": "Mayank", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 135, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 668.711, "r_x1": 93.2, "r_y1": 668.711, "r_x2": 93.2, "r_y2": 661.014, "r_x3": 70.031, "r_y3": 661.014, "coord_origin": "TOPLEFT"}, "text": "Singh.", "orig": "Singh.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 136, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 102.202, "r_y0": 668.711, "r_x1": 120.619, "r_y1": 668.711, "r_x2": 120.619, "r_y2": 661.014, "r_x3": 102.202, "r_y3": 661.014, "coord_origin": "TOPLEFT"}, "text": "Icdar", "orig": "Icdar", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 137, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 124.672, "r_y0": 668.711, "r_x1": 238.922, "r_y1": 668.711, "r_x2": 238.922, "r_y2": 661.014, "r_x3": 124.672, "r_y3": 661.014, "coord_origin": "TOPLEFT"}, "text": "2021 competition on scientific", "orig": "2021 competition on scientific", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 138, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 242.975, "r_y0": 668.711, "r_x1": 260.406, "r_y1": 668.711, "r_x2": 260.406, "r_y2": 661.014, "r_x3": 242.975, "r_y3": 661.014, "coord_origin": "TOPLEFT"}, "text": "table", "orig": "table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 139, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 264.449, "r_y0": 668.711, "r_x1": 286.363, "r_y1": 668.711, "r_x2": 286.363, "r_y2": 661.014, "r_x3": 264.449, "r_y3": 661.014, "coord_origin": "TOPLEFT"}, "text": "image", "orig": "image", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 140, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 679.67, "r_x1": 171.997, "r_y1": 679.67, "r_x2": 171.997, "r_y2": 671.973, "r_x3": 70.031, "r_y3": 671.973, "coord_origin": "TOPLEFT"}, "text": "recognition to latex, 2021. 2", "orig": "recognition to latex, 2021. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 141, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 690.942, "r_x1": 65.05, "r_y1": 690.942, "r_x2": 65.05, "r_y2": 683.245, "r_x3": 50.112, "r_y3": 683.245, "coord_origin": "TOPLEFT"}, "text": "[15]", "orig": "[15]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 142, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 690.942, "r_x1": 286.359, "r_y1": 690.942, "r_x2": 286.359, "r_y2": 683.245, "r_x3": 70.035, "r_y3": 683.245, "coord_origin": "TOPLEFT"}, "text": "Harold WKuhn. The hungarian method for the assignment", "orig": "Harold WKuhn. The hungarian method for the assignment", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 143, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 701.901, "r_x1": 102.158, "r_y1": 701.901, "r_x2": 102.158, "r_y2": 694.204, "r_x3": 70.031, "r_y3": 694.204, "coord_origin": "TOPLEFT"}, "text": "problem.", "orig": "problem.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 144, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 107.55, "r_y0": 701.772, "r_x1": 231.475, "r_y1": 701.772, "r_x2": 231.475, "r_y2": 694.042, "r_x3": 107.55, "r_y3": 694.042, "coord_origin": "TOPLEFT"}, "text": "Naval research logistics quarterly", "orig": "Naval research logistics quarterly", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 145, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 231.476, "r_y0": 701.901, "r_x1": 233.718, "r_y1": 701.901, "r_x2": 233.718, "r_y2": 694.204, "r_x3": 231.476, "r_y3": 694.204, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 146, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 236.802, "r_y0": 701.901, "r_x1": 286.359, "r_y1": 701.901, "r_x2": 286.359, "r_y2": 694.204, "r_x3": 236.802, "r_y3": 694.204, "coord_origin": "TOPLEFT"}, "text": "2(1-2):83-97,", "orig": "2(1-2):83-97,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 147, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 712.86, "r_x1": 97.917, "r_y1": 712.86, "r_x2": 97.917, "r_y2": 705.163, "r_x3": 70.031, "r_y3": 705.163, "coord_origin": "TOPLEFT"}, "text": "1955. 6", "orig": "1955. 6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 148, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 83.82299999999998, "r_x1": 323.8, "r_y1": 83.82299999999998, "r_x2": 323.8, "r_y2": 76.12599999999998, "r_x3": 308.862, "r_y3": 76.12599999999998, "coord_origin": "TOPLEFT"}, "text": "[16]", "orig": "[16]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 149, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.785, "r_y0": 83.82299999999998, "r_x1": 351.192, "r_y1": 83.82299999999998, "r_x2": 351.192, "r_y2": 76.12599999999998, "r_x3": 328.785, "r_y3": 76.12599999999998, "coord_origin": "TOPLEFT"}, "text": "Girish", "orig": "Girish", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 150, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 355.308, "r_y0": 83.82299999999998, "r_x1": 389.291, "r_y1": 83.82299999999998, "r_x2": 389.291, "r_y2": 76.12599999999998, "r_x3": 355.308, "r_y3": 76.12599999999998, "coord_origin": "TOPLEFT"}, "text": "Kulkarni,", "orig": "Kulkarni,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 151, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 393.863, "r_y0": 83.82299999999998, "r_x1": 420.225, "r_y1": 83.82299999999998, "r_x2": 420.225, "r_y2": 76.12599999999998, "r_x3": 393.863, "r_y3": 76.12599999999998, "coord_origin": "TOPLEFT"}, "text": "Visruth", "orig": "Visruth", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 152, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 424.331, "r_y0": 83.82299999999998, "r_x1": 454.961, "r_y1": 83.82299999999998, "r_x2": 454.961, "r_y2": 76.12599999999998, "r_x3": 424.331, "r_y3": 76.12599999999998, "coord_origin": "TOPLEFT"}, "text": "Premraj,", "orig": "Premraj,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 153, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 459.533, "r_y0": 83.82299999999998, "r_x1": 486.881, "r_y1": 83.82299999999998, "r_x2": 486.881, "r_y2": 76.12599999999998, "r_x3": 459.533, "r_y3": 76.12599999999998, "coord_origin": "TOPLEFT"}, "text": "Vicente", "orig": "Vicente", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 154, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 490.988, "r_y0": 83.82299999999998, "r_x1": 524.1, "r_y1": 83.82299999999998, "r_x2": 524.1, "r_y2": 76.12599999999998, "r_x3": 490.988, "r_y3": 76.12599999999998, "coord_origin": "TOPLEFT"}, "text": "Ordonez,", "orig": "Ordonez,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 155, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 528.673, "r_y0": 83.82299999999998, "r_x1": 545.109, "r_y1": 83.82299999999998, "r_x2": 545.109, "r_y2": 76.12599999999998, "r_x3": 528.673, "r_y3": 76.12599999999998, "coord_origin": "TOPLEFT"}, "text": "Sag-", "orig": "Sag-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 156, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 94.78099999999995, "r_x1": 545.113, "r_y1": 94.78099999999995, "r_x2": 545.113, "r_y2": 87.08399999999995, "r_x3": 328.781, "r_y3": 87.08399999999995, "coord_origin": "TOPLEFT"}, "text": "nik Dhar, Siming Li, Yejin Choi, Alexander C. Berg, and", "orig": "nik Dhar, Siming Li, Yejin Choi, Alexander C. Berg, and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 157, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 105.74000000000001, "r_x1": 390.963, "r_y1": 105.74000000000001, "r_x2": 390.963, "r_y2": 98.043, "r_x3": 328.781, "r_y3": 98.043, "coord_origin": "TOPLEFT"}, "text": "Tamara L. Berg.", "orig": "Tamara L. Berg.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 158, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 400.27, "r_y0": 105.74000000000001, "r_x1": 435.14, "r_y1": 105.74000000000001, "r_x2": 435.14, "r_y2": 98.043, "r_x3": 400.27, "r_y3": 98.043, "coord_origin": "TOPLEFT"}, "text": "Babytalk:", "orig": "Babytalk:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 159, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 441.713, "r_y0": 105.74000000000001, "r_x1": 494.507, "r_y1": 105.74000000000001, "r_x2": 494.507, "r_y2": 98.043, "r_x3": 441.713, "r_y3": 98.043, "coord_origin": "TOPLEFT"}, "text": "Understanding", "orig": "Understanding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 160, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 498.649, "r_y0": 105.74000000000001, "r_x1": 545.113, "r_y1": 105.74000000000001, "r_x2": 545.113, "r_y2": 98.043, "r_x3": 498.649, "r_y3": 98.043, "coord_origin": "TOPLEFT"}, "text": "and generat-", "orig": "and generat-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 161, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 116.69899999999996, "r_x1": 440.807, "r_y1": 116.69899999999996, "r_x2": 440.807, "r_y2": 109.00199999999995, "r_x3": 328.781, "r_y3": 109.00199999999995, "coord_origin": "TOPLEFT"}, "text": "ing simple image descriptions.", "orig": "ing simple image descriptions.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 162, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 446.635, "r_y0": 116.57000000000005, "r_x1": 545.113, "r_y1": 116.57000000000005, "r_x2": 545.113, "r_y2": 108.84000000000003, "r_x3": 446.635, "r_y3": 108.84000000000003, "coord_origin": "TOPLEFT"}, "text": "IEEE Transactions on Pat-", "orig": "IEEE Transactions on Pat-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 163, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 127.529, "r_x1": 471.132, "r_y1": 127.529, "r_x2": 471.132, "r_y2": 119.79899999999998, "r_x3": 328.781, "r_y3": 119.79899999999998, "coord_origin": "TOPLEFT"}, "text": "tern Analysis and Machine Intelligence", "orig": "tern Analysis and Machine Intelligence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 164, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 471.133, "r_y0": 127.65800000000002, "r_x1": 473.375, "r_y1": 127.65800000000002, "r_x2": 473.375, "r_y2": 119.96100000000001, "r_x3": 471.133, "r_y3": 119.96100000000001, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 165, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 476.127, "r_y0": 127.65800000000002, "r_x1": 545.115, "r_y1": 127.65800000000002, "r_x2": 545.115, "r_y2": 119.96100000000001, "r_x3": 476.127, "r_y3": 119.96100000000001, "coord_origin": "TOPLEFT"}, "text": "35(12):2891-2903,", "orig": "35(12):2891-2903,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 166, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 138.61699999999996, "r_x1": 356.667, "r_y1": 138.61699999999996, "r_x2": 356.667, "r_y2": 130.91999999999996, "r_x3": 328.781, "r_y3": 130.91999999999996, "coord_origin": "TOPLEFT"}, "text": "2013. 4", "orig": "2013. 4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 167, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 150.063, "r_x1": 323.8, "r_y1": 150.063, "r_x2": 323.8, "r_y2": 142.36599999999999, "r_x3": 308.862, "r_y3": 142.36599999999999, "coord_origin": "TOPLEFT"}, "text": "[17]", "orig": "[17]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 168, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.785, "r_y0": 150.063, "r_x1": 375.698, "r_y1": 150.063, "r_x2": 375.698, "r_y2": 142.36599999999999, "r_x3": 328.785, "r_y3": 142.36599999999999, "coord_origin": "TOPLEFT"}, "text": "Minghao Li,", "orig": "Minghao Li,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 169, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 380.557, "r_y0": 150.063, "r_x1": 392.51, "r_y1": 150.063, "r_x2": 392.51, "r_y2": 142.36599999999999, "r_x3": 380.557, "r_y3": 142.36599999999999, "coord_origin": "TOPLEFT"}, "text": "Lei", "orig": "Lei", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 170, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 396.84, "r_y0": 150.063, "r_x1": 412.038, "r_y1": 150.063, "r_x2": 412.038, "r_y2": 142.36599999999999, "r_x3": 396.84, "r_y3": 142.36599999999999, "coord_origin": "TOPLEFT"}, "text": "Cui,", "orig": "Cui,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 171, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 416.889, "r_y0": 150.063, "r_x1": 478.246, "r_y1": 150.063, "r_x2": 478.246, "r_y2": 142.36599999999999, "r_x3": 416.889, "r_y3": 142.36599999999999, "coord_origin": "TOPLEFT"}, "text": "Shaohan Huang,", "orig": "Shaohan Huang,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 172, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 483.097, "r_y0": 150.063, "r_x1": 500.035, "r_y1": 150.063, "r_x2": 500.035, "r_y2": 142.36599999999999, "r_x3": 483.097, "r_y3": 142.36599999999999, "coord_origin": "TOPLEFT"}, "text": "Furu", "orig": "Furu", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 173, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 504.365, "r_y0": 150.063, "r_x1": 520.828, "r_y1": 150.063, "r_x2": 520.828, "r_y2": 142.36599999999999, "r_x3": 504.365, "r_y3": 142.36599999999999, "coord_origin": "TOPLEFT"}, "text": "Wei,", "orig": "Wei,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 174, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 525.679, "r_y0": 150.063, "r_x1": 545.109, "r_y1": 150.063, "r_x2": 545.109, "r_y2": 142.36599999999999, "r_x3": 525.679, "r_y3": 142.36599999999999, "coord_origin": "TOPLEFT"}, "text": "Ming", "orig": "Ming", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 175, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 161.02099999999996, "r_x1": 414.446, "r_y1": 161.02099999999996, "r_x2": 414.446, "r_y2": 153.32399999999996, "r_x3": 328.781, "r_y3": 153.32399999999996, "coord_origin": "TOPLEFT"}, "text": "Zhou, and Zhoujun Li.", "orig": "Zhou, and Zhoujun Li.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 176, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 421.825, "r_y0": 161.02099999999996, "r_x1": 461.448, "r_y1": 161.02099999999996, "r_x2": 461.448, "r_y2": 153.32399999999996, "r_x3": 421.825, "r_y3": 153.32399999999996, "coord_origin": "TOPLEFT"}, "text": "Tablebank:", "orig": "Tablebank:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 177, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 466.828, "r_y0": 161.02099999999996, "r_x1": 545.113, "r_y1": 161.02099999999996, "r_x2": 545.113, "r_y2": 153.32399999999996, "r_x3": 466.828, "r_y3": 153.32399999999996, "coord_origin": "TOPLEFT"}, "text": "A benchmark dataset", "orig": "A benchmark dataset", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 178, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 171.98000000000002, "r_x1": 493.628, "r_y1": 171.98000000000002, "r_x2": 493.628, "r_y2": 164.28300000000002, "r_x3": 328.781, "r_y3": 164.28300000000002, "coord_origin": "TOPLEFT"}, "text": "for table detection and recognition, 2019. 2, 3", "orig": "for table detection and recognition, 2019. 2, 3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 179, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 183.42600000000004, "r_x1": 323.8, "r_y1": 183.42600000000004, "r_x2": 323.8, "r_y2": 175.72900000000004, "r_x3": 308.862, "r_y3": 175.72900000000004, "coord_origin": "TOPLEFT"}, "text": "[18]", "orig": "[18]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 180, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.785, "r_y0": 183.42600000000004, "r_x1": 545.109, "r_y1": 183.42600000000004, "r_x2": 545.109, "r_y2": 175.72900000000004, "r_x3": 328.785, "r_y3": 175.72900000000004, "coord_origin": "TOPLEFT"}, "text": "Yiren Li, Zheng Huang, Junchi Yan, Yi Zhou, Fan Ye, and", "orig": "Yiren Li, Zheng Huang, Junchi Yan, Yi Zhou, Fan Ye, and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 181, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 194.385, "r_x1": 375.397, "r_y1": 194.385, "r_x2": 375.397, "r_y2": 186.688, "r_x3": 328.781, "r_y3": 186.688, "coord_origin": "TOPLEFT"}, "text": "Xianhui Liu.", "orig": "Xianhui Liu.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 182, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 381.154, "r_y0": 194.385, "r_x1": 399.58, "r_y1": 194.385, "r_x2": 399.58, "r_y2": 186.688, "r_x3": 381.154, "r_y3": 186.688, "coord_origin": "TOPLEFT"}, "text": "Gfte:", "orig": "Gfte:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 183, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 403.937, "r_y0": 194.385, "r_x1": 545.113, "r_y1": 194.385, "r_x2": 545.113, "r_y2": 186.688, "r_x3": 403.937, "r_y3": 186.688, "coord_origin": "TOPLEFT"}, "text": "Graph-based financial table extraction.", "orig": "Graph-based financial table extraction.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 184, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 205.34400000000005, "r_x1": 545.113, "r_y1": 205.34400000000005, "r_x2": 545.113, "r_y2": 197.64700000000005, "r_x3": 328.781, "r_y3": 197.64700000000005, "coord_origin": "TOPLEFT"}, "text": "In Alberto Del Bimbo, Rita Cucchiara, Stan Sclaroff, Gio-", "orig": "In Alberto Del Bimbo, Rita Cucchiara, Stan Sclaroff, Gio-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 185, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 216.303, "r_x1": 545.113, "r_y1": 216.303, "r_x2": 545.113, "r_y2": 208.606, "r_x3": 328.781, "r_y3": 208.606, "coord_origin": "TOPLEFT"}, "text": "vanni Maria Farinella, Tao Mei, Marco Bertini, Hugo Jair", "orig": "vanni Maria Farinella, Tao Mei, Marco Bertini, Hugo Jair", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 186, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 227.26199999999994, "r_x1": 365.382, "r_y1": 227.26199999999994, "r_x2": 365.382, "r_y2": 219.56500000000005, "r_x3": 328.781, "r_y3": 219.56500000000005, "coord_origin": "TOPLEFT"}, "text": "Escalante,", "orig": "Escalante,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 187, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 369.237, "r_y0": 227.26199999999994, "r_x1": 479.264, "r_y1": 227.26199999999994, "r_x2": 479.264, "r_y2": 219.56500000000005, "r_x3": 369.237, "r_y3": 219.56500000000005, "coord_origin": "TOPLEFT"}, "text": "and Roberto Vezzani, editors,", "orig": "and Roberto Vezzani, editors,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 188, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 483.119, "r_y0": 227.13300000000004, "r_x1": 545.113, "r_y1": 227.13300000000004, "r_x2": 545.113, "r_y2": 219.40300000000002, "r_x3": 483.119, "r_y3": 219.40300000000002, "coord_origin": "TOPLEFT"}, "text": "Pattern Recogni-", "orig": "Pattern Recogni-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 189, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 238.091, "r_x1": 519.398, "r_y1": 238.091, "r_x2": 519.398, "r_y2": 230.361, "r_x3": 328.781, "r_y3": 230.361, "coord_origin": "TOPLEFT"}, "text": "tion. ICPR International Workshops and Challenges", "orig": "tion. ICPR International Workshops and Challenges", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 190, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 519.401, "r_y0": 238.22000000000003, "r_x1": 521.643, "r_y1": 238.22000000000003, "r_x2": 521.643, "r_y2": 230.52300000000002, "r_x3": 519.401, "r_y3": 230.52300000000002, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 191, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 524.691, "r_y0": 238.22000000000003, "r_x1": 545.108, "r_y1": 238.22000000000003, "r_x2": 545.108, "r_y2": 230.52300000000002, "r_x3": 524.691, "r_y3": 230.52300000000002, "coord_origin": "TOPLEFT"}, "text": "pages", "orig": "pages", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 192, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 249.17899999999997, "r_x1": 545.113, "r_y1": 249.17899999999997, "r_x2": 545.113, "r_y2": 241.48199999999997, "r_x3": 328.781, "r_y3": 241.48199999999997, "coord_origin": "TOPLEFT"}, "text": "644-658, Cham, 2021. Springer International Publishing. 2,", "orig": "644-658, Cham, 2021. Springer International Publishing. 2,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 193, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 260.13800000000003, "r_x1": 333.264, "r_y1": 260.13800000000003, "r_x2": 333.264, "r_y2": 252.44100000000003, "r_x3": 328.781, "r_y3": 252.44100000000003, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 194, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 271.58399999999995, "r_x1": 323.8, "r_y1": 271.58399999999995, "r_x2": 323.8, "r_y2": 263.88699999999994, "r_x3": 308.862, "r_y3": 263.88699999999994, "coord_origin": "TOPLEFT"}, "text": "[19]", "orig": "[19]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 195, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.785, "r_y0": 271.58399999999995, "r_x1": 545.109, "r_y1": 271.58399999999995, "r_x2": 545.109, "r_y2": 263.88699999999994, "r_x3": 328.785, "r_y3": 263.88699999999994, "coord_origin": "TOPLEFT"}, "text": "Nikolaos Livathinos, Cesar Berrospi, Maksym Lysak, Vik-", "orig": "Nikolaos Livathinos, Cesar Berrospi, Maksym Lysak, Vik-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 196, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 282.543, "r_x1": 545.113, "r_y1": 282.543, "r_x2": 545.113, "r_y2": 274.846, "r_x3": 328.781, "r_y3": 274.846, "coord_origin": "TOPLEFT"}, "text": "tor Kuropiatnyk, Ahmed Nassar, Andre Carvalho, Michele", "orig": "tor Kuropiatnyk, Ahmed Nassar, Andre Carvalho, Michele", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 197, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 293.502, "r_x1": 527.118, "r_y1": 293.502, "r_x2": 527.118, "r_y2": 285.805, "r_x3": 328.781, "r_y3": 285.805, "coord_origin": "TOPLEFT"}, "text": "Dolfi, Christoph Auer, Kasper Dinkla, and Peter Staar.", "orig": "Dolfi, Christoph Auer, Kasper Dinkla, and Peter Staar.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 198, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 531.664, "r_y0": 293.502, "r_x1": 545.113, "r_y1": 293.502, "r_x2": 545.113, "r_y2": 285.805, "r_x3": 531.664, "r_y3": 285.805, "coord_origin": "TOPLEFT"}, "text": "Ro-", "orig": "Ro-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 199, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 304.461, "r_x1": 343.549, "r_y1": 304.461, "r_x2": 343.549, "r_y2": 296.764, "r_x3": 328.781, "r_y3": 296.764, "coord_origin": "TOPLEFT"}, "text": "bust", "orig": "bust", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 200, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 347.44, "r_y0": 304.461, "r_x1": 545.113, "r_y1": 304.461, "r_x2": 545.113, "r_y2": 296.764, "r_x3": 347.44, "r_y3": 296.764, "coord_origin": "TOPLEFT"}, "text": "pdf document conversion using recurrent neural net-", "orig": "pdf document conversion using recurrent neural net-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 201, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 315.419, "r_x1": 352.847, "r_y1": 315.419, "r_x2": 352.847, "r_y2": 307.722, "r_x3": 328.781, "r_y3": 307.722, "coord_origin": "TOPLEFT"}, "text": "works.", "orig": "works.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 202, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 360.236, "r_y0": 315.29, "r_x1": 545.114, "r_y1": 315.29, "r_x2": 545.114, "r_y2": 307.56, "r_x3": 360.236, "r_y3": 307.56, "coord_origin": "TOPLEFT"}, "text": "Proceedings of the AAAI Conference on Artificial", "orig": "Proceedings of the AAAI Conference on Artificial", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 203, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 326.249, "r_x1": 371.022, "r_y1": 326.249, "r_x2": 371.022, "r_y2": 318.519, "r_x3": 328.781, "r_y3": 318.519, "coord_origin": "TOPLEFT"}, "text": "Intelligence", "orig": "Intelligence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 204, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 371.021, "r_y0": 326.378, "r_x1": 502.262, "r_y1": 326.378, "r_x2": 502.262, "r_y2": 318.681, "r_x3": 371.021, "r_y3": 318.681, "coord_origin": "TOPLEFT"}, "text": ", 35(17):15137-15145, May 2021. 1", "orig": ", 35(17):15137-15145, May 2021. 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 205, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 337.824, "r_x1": 323.8, "r_y1": 337.824, "r_x2": 323.8, "r_y2": 330.127, "r_x3": 308.862, "r_y3": 330.127, "coord_origin": "TOPLEFT"}, "text": "[20]", "orig": "[20]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 206, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.785, "r_y0": 337.824, "r_x1": 545.109, "r_y1": 337.824, "r_x2": 545.109, "r_y2": 330.127, "r_x3": 328.785, "r_y3": 330.127, "coord_origin": "TOPLEFT"}, "text": "Rujiao Long, Wen Wang, Nan Xue, Feiyu Gao, Zhibo Yang,", "orig": "Rujiao Long, Wen Wang, Nan Xue, Feiyu Gao, Zhibo Yang,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 207, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 348.783, "r_x1": 456.821, "r_y1": 348.783, "r_x2": 456.821, "r_y2": 341.086, "r_x3": 328.781, "r_y3": 341.086, "coord_origin": "TOPLEFT"}, "text": "Yongpan Wang, and Gui-Song Xia.", "orig": "Yongpan Wang, and Gui-Song Xia.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 208, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 460.991, "r_y0": 348.783, "r_x1": 545.113, "r_y1": 348.783, "r_x2": 545.113, "r_y2": 341.086, "r_x3": 460.991, "r_y3": 341.086, "coord_origin": "TOPLEFT"}, "text": "Parsing table structures", "orig": "Parsing table structures", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 209, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 359.742, "r_x1": 370.421, "r_y1": 359.742, "r_x2": 370.421, "r_y2": 352.045, "r_x3": 328.781, "r_y3": 352.045, "coord_origin": "TOPLEFT"}, "text": "in the wild.", "orig": "in the wild.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 210, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 375.308, "r_y0": 359.742, "r_x1": 382.777, "r_y1": 359.742, "r_x2": 382.777, "r_y2": 352.045, "r_x3": 375.308, "r_y3": 352.045, "coord_origin": "TOPLEFT"}, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 211, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 385.541, "r_y0": 359.613, "r_x1": 545.116, "r_y1": 359.613, "r_x2": 545.116, "r_y2": 351.883, "r_x3": 385.541, "r_y3": 351.883, "coord_origin": "TOPLEFT"}, "text": "Proceedings of the IEEE/CVF International", "orig": "Proceedings of the IEEE/CVF International", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 212, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 370.572, "r_x1": 443.596, "r_y1": 370.572, "r_x2": 443.596, "r_y2": 362.842, "r_x3": 328.781, "r_y3": 362.842, "coord_origin": "TOPLEFT"}, "text": "Conference on Computer Vision", "orig": "Conference on Computer Vision", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 213, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 443.594, "r_y0": 370.701, "r_x1": 534.486, "r_y1": 370.701, "r_x2": 534.486, "r_y2": 363.004, "r_x3": 443.594, "r_y3": 363.004, "coord_origin": "TOPLEFT"}, "text": ", pages 944-952, 2021. 2", "orig": ", pages 944-952, 2021. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 214, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 382.146, "r_x1": 323.8, "r_y1": 382.146, "r_x2": 323.8, "r_y2": 374.449, "r_x3": 308.862, "r_y3": 374.449, "coord_origin": "TOPLEFT"}, "text": "[21]", "orig": "[21]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 215, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.785, "r_y0": 382.146, "r_x1": 362.66, "r_y1": 382.146, "r_x2": 362.66, "r_y2": 374.449, "r_x3": 328.785, "r_y3": 374.449, "coord_origin": "TOPLEFT"}, "text": "Shubham", "orig": "Shubham", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 216, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 368.695, "r_y0": 382.146, "r_x1": 389.613, "r_y1": 382.146, "r_x2": 389.613, "r_y2": 374.449, "r_x3": 368.695, "r_y3": 374.449, "coord_origin": "TOPLEFT"}, "text": "Singh", "orig": "Singh", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 217, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 395.648, "r_y0": 382.146, "r_x1": 424.564, "r_y1": 382.146, "r_x2": 424.564, "r_y2": 374.449, "r_x3": 395.648, "r_y3": 374.449, "coord_origin": "TOPLEFT"}, "text": "Paliwal,", "orig": "Paliwal,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 218, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 431.549, "r_y0": 382.146, "r_x1": 488.504, "r_y1": 382.146, "r_x2": 488.504, "r_y2": 374.449, "r_x3": 431.549, "r_y3": 374.449, "coord_origin": "TOPLEFT"}, "text": "D Vishwanath,", "orig": "D Vishwanath,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 219, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 495.48, "r_y0": 382.146, "r_x1": 515.412, "r_y1": 382.146, "r_x2": 515.412, "r_y2": 374.449, "r_x3": 495.48, "r_y3": 374.449, "coord_origin": "TOPLEFT"}, "text": "Rohit", "orig": "Rohit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 220, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 521.446, "r_y0": 382.146, "r_x1": 545.109, "r_y1": 382.146, "r_x2": 545.109, "r_y2": 374.449, "r_x3": 521.446, "r_y3": 374.449, "coord_origin": "TOPLEFT"}, "text": "Rahul,", "orig": "Rahul,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 221, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 393.105, "r_x1": 460.318, "r_y1": 393.105, "r_x2": 460.318, "r_y2": 385.408, "r_x3": 328.781, "r_y3": 385.408, "coord_origin": "TOPLEFT"}, "text": "Monika Sharma, and Lovekesh Vig.", "orig": "Monika Sharma, and Lovekesh Vig.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 222, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 465.393, "r_y0": 393.105, "r_x1": 498.542, "r_y1": 393.105, "r_x2": 498.542, "r_y2": 385.408, "r_x3": 465.393, "r_y3": 385.408, "coord_origin": "TOPLEFT"}, "text": "Tablenet:", "orig": "Tablenet:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 223, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 502.469, "r_y0": 393.105, "r_x1": 545.113, "r_y1": 393.105, "r_x2": 545.113, "r_y2": 385.408, "r_x3": 502.469, "r_y3": 385.408, "coord_origin": "TOPLEFT"}, "text": "Deep learn-", "orig": "Deep learn-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 224, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 404.064, "r_x1": 545.113, "r_y1": 404.064, "r_x2": 545.113, "r_y2": 396.367, "r_x3": 328.781, "r_y3": 396.367, "coord_origin": "TOPLEFT"}, "text": "ing model for end-to-end table detection and tabular data ex-", "orig": "ing model for end-to-end table detection and tabular data ex-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 225, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 415.023, "r_x1": 478.009, "r_y1": 415.023, "r_x2": 478.009, "r_y2": 407.326, "r_x3": 328.781, "r_y3": 407.326, "coord_origin": "TOPLEFT"}, "text": "traction from scanned document images.", "orig": "traction from scanned document images.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 226, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 484.07, "r_y0": 415.023, "r_x1": 491.539, "r_y1": 415.023, "r_x2": 491.539, "r_y2": 407.326, "r_x3": 484.07, "r_y3": 407.326, "coord_origin": "TOPLEFT"}, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 227, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 494.668, "r_y0": 414.894, "r_x1": 545.113, "r_y1": 414.894, "r_x2": 545.113, "r_y2": 407.164, "r_x3": 494.668, "r_y3": 407.164, "coord_origin": "TOPLEFT"}, "text": "2019 Interna-", "orig": "2019 Interna-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 228, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 425.853, "r_x1": 349.709, "r_y1": 425.853, "r_x2": 349.709, "r_y2": 418.123, "r_x3": 328.781, "r_y3": 418.123, "coord_origin": "TOPLEFT"}, "text": "tional", "orig": "tional", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 229, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 353.295, "r_y0": 425.853, "r_x1": 545.113, "r_y1": 425.853, "r_x2": 545.113, "r_y2": 418.123, "r_x3": 353.295, "r_y3": 418.123, "coord_origin": "TOPLEFT"}, "text": "Conference on Document Analysis and Recognition", "orig": "Conference on Document Analysis and Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 230, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 436.812, "r_x1": 360.836, "r_y1": 436.812, "r_x2": 360.836, "r_y2": 429.082, "r_x3": 328.781, "r_y3": 429.082, "coord_origin": "TOPLEFT"}, "text": "(ICDAR)", "orig": "(ICDAR)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 231, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 360.836, "r_y0": 436.941, "r_x1": 475.633, "r_y1": 436.941, "r_x2": 475.633, "r_y2": 429.244, "r_x3": 360.836, "r_y3": 429.244, "coord_origin": "TOPLEFT"}, "text": ", pages 128-133. IEEE, 2019. 1", "orig": ", pages 128-133. IEEE, 2019. 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 232, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 448.386, "r_x1": 323.8, "r_y1": 448.386, "r_x2": 323.8, "r_y2": 440.689, "r_x3": 308.862, "r_y3": 440.689, "coord_origin": "TOPLEFT"}, "text": "[22]", "orig": "[22]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 233, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.785, "r_y0": 448.386, "r_x1": 545.109, "r_y1": 448.386, "r_x2": 545.109, "r_y2": 440.689, "r_x3": 328.785, "r_y3": 440.689, "coord_origin": "TOPLEFT"}, "text": "Adam Paszke, Sam Gross, Francisco Massa, Adam Lerer,", "orig": "Adam Paszke, Sam Gross, Francisco Massa, Adam Lerer,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 234, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 459.345, "r_x1": 545.113, "r_y1": 459.345, "r_x2": 545.113, "r_y2": 451.648, "r_x3": 328.781, "r_y3": 451.648, "coord_origin": "TOPLEFT"}, "text": "James Bradbury, Gregory Chanan, Trevor Killeen, Zeming", "orig": "James Bradbury, Gregory Chanan, Trevor Killeen, Zeming", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 235, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 470.304, "r_x1": 343.477, "r_y1": 470.304, "r_x2": 343.477, "r_y2": 462.607, "r_x3": 328.781, "r_y3": 462.607, "coord_origin": "TOPLEFT"}, "text": "Lin,", "orig": "Lin,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 236, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 347.601, "r_y0": 470.304, "r_x1": 373.496, "r_y1": 470.304, "r_x2": 373.496, "r_y2": 462.607, "r_x3": 347.601, "r_y3": 462.607, "coord_origin": "TOPLEFT"}, "text": "Natalia", "orig": "Natalia", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 237, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 377.244, "r_y0": 470.304, "r_x1": 420.83, "r_y1": 470.304, "r_x2": 420.83, "r_y2": 462.607, "r_x3": 377.244, "r_y3": 462.607, "coord_origin": "TOPLEFT"}, "text": "Gimelshein,", "orig": "Gimelshein,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 238, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 424.955, "r_y0": 470.304, "r_x1": 473.239, "r_y1": 470.304, "r_x2": 473.239, "r_y2": 462.607, "r_x3": 424.955, "r_y3": 462.607, "coord_origin": "TOPLEFT"}, "text": "Luca Antiga,", "orig": "Luca Antiga,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 239, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 477.363, "r_y0": 470.304, "r_x1": 545.113, "r_y1": 470.304, "r_x2": 545.113, "r_y2": 462.607, "r_x3": 477.363, "r_y3": 462.607, "coord_origin": "TOPLEFT"}, "text": "Alban Desmaison,", "orig": "Alban Desmaison,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 240, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 481.263, "r_x1": 545.113, "r_y1": 481.263, "r_x2": 545.113, "r_y2": 473.566, "r_x3": 328.781, "r_y3": 473.566, "coord_origin": "TOPLEFT"}, "text": "Andreas Kopf, Edward Yang, Zachary DeVito, Martin Rai-", "orig": "Andreas Kopf, Edward Yang, Zachary DeVito, Martin Rai-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 241, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 492.222, "r_x1": 545.113, "r_y1": 492.222, "r_x2": 545.113, "r_y2": 484.525, "r_x3": 328.781, "r_y3": 484.525, "coord_origin": "TOPLEFT"}, "text": "son, Alykhan Tejani, Sasank Chilamkurthy, Benoit Steiner,", "orig": "son, Alykhan Tejani, Sasank Chilamkurthy, Benoit Steiner,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 242, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 503.181, "r_x1": 545.113, "r_y1": 503.181, "r_x2": 545.113, "r_y2": 495.484, "r_x3": 328.781, "r_y3": 495.484, "coord_origin": "TOPLEFT"}, "text": "Lu Fang, Junjie Bai, and Soumith Chintala. Pytorch: An im-", "orig": "Lu Fang, Junjie Bai, and Soumith Chintala. Pytorch: An im-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 243, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 514.14, "r_x1": 545.113, "r_y1": 514.14, "r_x2": 545.113, "r_y2": 506.443, "r_x3": 328.781, "r_y3": 506.443, "coord_origin": "TOPLEFT"}, "text": "perative style, high-performance deep learning library. In H.", "orig": "perative style, high-performance deep learning library. In H.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 244, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 525.0989999999999, "r_x1": 545.11, "r_y1": 525.0989999999999, "r_x2": 545.11, "r_y2": 517.402, "r_x3": 328.781, "r_y3": 517.402, "coord_origin": "TOPLEFT"}, "text": "Wallach, H. Larochelle, A. Beygelzimer, F. d'Alch\u00b4-Buc, E.", "orig": "Wallach, H. Larochelle, A. Beygelzimer, F. d'Alch\u00b4-Buc, E.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 245, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 511.145, "r_y0": 525.0989999999999, "r_x1": 515.126, "r_y1": 525.0989999999999, "r_x2": 515.126, "r_y2": 517.402, "r_x3": 511.145, "r_y3": 517.402, "coord_origin": "TOPLEFT"}, "text": "e", "orig": "e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 246, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 536.057, "r_x1": 434.567, "r_y1": 536.057, "r_x2": 434.567, "r_y2": 528.36, "r_x3": 328.781, "r_y3": 528.36, "coord_origin": "TOPLEFT"}, "text": "Fox, and R. Garnett, editors,", "orig": "Fox, and R. Garnett, editors,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 247, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 437.864, "r_y0": 535.928, "r_x1": 545.111, "r_y1": 535.928, "r_x2": 545.111, "r_y2": 528.198, "r_x3": 437.864, "r_y3": 528.198, "coord_origin": "TOPLEFT"}, "text": "Advances in Neural Informa-", "orig": "Advances in Neural Informa-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 248, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 546.887, "r_x1": 425.735, "r_y1": 546.887, "r_x2": 425.735, "r_y2": 539.157, "r_x3": 328.781, "r_y3": 539.157, "coord_origin": "TOPLEFT"}, "text": "tion Processing Systems 32", "orig": "tion Processing Systems 32", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 249, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 425.736, "r_y0": 547.016, "r_x1": 545.115, "r_y1": 547.016, "r_x2": 545.115, "r_y2": 539.319, "r_x3": 425.736, "r_y3": 539.319, "coord_origin": "TOPLEFT"}, "text": ", pages 8024-8035. Curran Asso-", "orig": ", pages 8024-8035. Curran Asso-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 250, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 557.975, "r_x1": 399.741, "r_y1": 557.975, "r_x2": 399.741, "r_y2": 550.278, "r_x3": 328.781, "r_y3": 550.278, "coord_origin": "TOPLEFT"}, "text": "ciates, Inc., 2019. 6", "orig": "ciates, Inc., 2019. 6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 251, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 569.421, "r_x1": 323.8, "r_y1": 569.421, "r_x2": 323.8, "r_y2": 561.7239999999999, "r_x3": 308.862, "r_y3": 561.7239999999999, "coord_origin": "TOPLEFT"}, "text": "[23]", "orig": "[23]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 252, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.785, "r_y0": 569.421, "r_x1": 395.433, "r_y1": 569.421, "r_x2": 395.433, "r_y2": 561.7239999999999, "r_x3": 328.785, "r_y3": 561.7239999999999, "coord_origin": "TOPLEFT"}, "text": "Devashish Prasad,", "orig": "Devashish Prasad,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 253, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 399.369, "r_y0": 569.421, "r_x1": 545.109, "r_y1": 569.421, "r_x2": 545.109, "r_y2": 561.7239999999999, "r_x3": 399.369, "r_y3": 561.7239999999999, "coord_origin": "TOPLEFT"}, "text": "Ayan Gadpal, Kshitij Kapadni, Manish", "orig": "Ayan Gadpal, Kshitij Kapadni, Manish", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 254, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 580.38, "r_x1": 545.113, "r_y1": 580.38, "r_x2": 545.113, "r_y2": 572.683, "r_x3": 328.781, "r_y3": 572.683, "coord_origin": "TOPLEFT"}, "text": "Visave, and Kavita Sultanpure. Cascadetabnet: An approach", "orig": "Visave, and Kavita Sultanpure. Cascadetabnet: An approach", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 255, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 591.3389999999999, "r_x1": 545.113, "r_y1": 591.3389999999999, "r_x2": 545.113, "r_y2": 583.642, "r_x3": 328.781, "r_y3": 583.642, "coord_origin": "TOPLEFT"}, "text": "for end to end table detection and structure recognition from", "orig": "for end to end table detection and structure recognition from", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 256, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 602.298, "r_x1": 418.266, "r_y1": 602.298, "r_x2": 418.266, "r_y2": 594.601, "r_x3": 328.781, "r_y3": 594.601, "coord_origin": "TOPLEFT"}, "text": "image-based documents.", "orig": "image-based documents.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 257, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 424.148, "r_y0": 602.298, "r_x1": 431.617, "r_y1": 602.298, "r_x2": 431.617, "r_y2": 594.601, "r_x3": 424.148, "r_y3": 594.601, "coord_origin": "TOPLEFT"}, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 258, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 434.691, "r_y0": 602.169, "r_x1": 545.112, "r_y1": 602.169, "r_x2": 545.112, "r_y2": 594.439, "r_x3": 434.691, "r_y3": 594.439, "coord_origin": "TOPLEFT"}, "text": "Proceedings of the IEEE/CVF", "orig": "Proceedings of the IEEE/CVF", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 259, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 613.127, "r_x1": 369.784, "r_y1": 613.127, "r_x2": 369.784, "r_y2": 605.3969999999999, "r_x3": 328.781, "r_y3": 605.3969999999999, "coord_origin": "TOPLEFT"}, "text": "Conference", "orig": "Conference", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 260, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 374.008, "r_y0": 613.127, "r_x1": 449.549, "r_y1": 613.127, "r_x2": 449.549, "r_y2": 605.3969999999999, "r_x3": 374.008, "r_y3": 605.3969999999999, "coord_origin": "TOPLEFT"}, "text": "on Computer Vision", "orig": "on Computer Vision", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 261, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 453.782, "r_y0": 613.127, "r_x1": 497.636, "r_y1": 613.127, "r_x2": 497.636, "r_y2": 605.3969999999999, "r_x3": 453.782, "r_y3": 605.3969999999999, "coord_origin": "TOPLEFT"}, "text": "and Pattern", "orig": "and Pattern", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 262, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 501.868, "r_y0": 613.127, "r_x1": 545.113, "r_y1": 613.127, "r_x2": 545.113, "r_y2": 605.3969999999999, "r_x3": 501.868, "r_y3": 605.3969999999999, "coord_origin": "TOPLEFT"}, "text": "Recognition", "orig": "Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 263, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 624.086, "r_x1": 367.803, "r_y1": 624.086, "r_x2": 367.803, "r_y2": 616.356, "r_x3": 328.781, "r_y3": 616.356, "coord_origin": "TOPLEFT"}, "text": "Workshops", "orig": "Workshops", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 264, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 367.802, "r_y0": 624.215, "r_x1": 458.694, "r_y1": 624.215, "r_x2": 458.694, "r_y2": 616.518, "r_x3": 367.802, "r_y3": 616.518, "coord_origin": "TOPLEFT"}, "text": ", pages 572-573, 2020. 1", "orig": ", pages 572-573, 2020. 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 265, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 635.6610000000001, "r_x1": 323.8, "r_y1": 635.6610000000001, "r_x2": 323.8, "r_y2": 627.9639999999999, "r_x3": 308.862, "r_y3": 627.9639999999999, "coord_origin": "TOPLEFT"}, "text": "[24]", "orig": "[24]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 266, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.785, "r_y0": 635.6610000000001, "r_x1": 545.109, "r_y1": 635.6610000000001, "r_x2": 545.109, "r_y2": 627.9639999999999, "r_x3": 328.785, "r_y3": 627.9639999999999, "coord_origin": "TOPLEFT"}, "text": "Shah Rukh Qasim, Hassan Mahmood, and Faisal Shafait.", "orig": "Shah Rukh Qasim, Hassan Mahmood, and Faisal Shafait.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 267, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 646.62, "r_x1": 545.113, "r_y1": 646.62, "r_x2": 545.113, "r_y2": 638.923, "r_x3": 328.781, "r_y3": 638.923, "coord_origin": "TOPLEFT"}, "text": "Rethinking table recognition using graph neural networks.", "orig": "Rethinking table recognition using graph neural networks.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 268, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 657.579, "r_x1": 336.25, "r_y1": 657.579, "r_x2": 336.25, "r_y2": 649.8820000000001, "r_x3": 328.781, "r_y3": 649.8820000000001, "coord_origin": "TOPLEFT"}, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 269, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 338.1, "r_y0": 657.45, "r_x1": 545.116, "r_y1": 657.45, "r_x2": 545.116, "r_y2": 649.72, "r_x3": 338.1, "r_y3": 649.72, "coord_origin": "TOPLEFT"}, "text": "2019 International Conference on Document Analysis and", "orig": "2019 International Conference on Document Analysis and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 270, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 668.409, "r_x1": 406.322, "r_y1": 668.409, "r_x2": 406.322, "r_y2": 660.679, "r_x3": 328.781, "r_y3": 660.679, "coord_origin": "TOPLEFT"}, "text": "Recognition (ICDAR)", "orig": "Recognition (ICDAR)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 271, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 406.322, "r_y0": 668.538, "r_x1": 521.119, "r_y1": 668.538, "r_x2": 521.119, "r_y2": 660.841, "r_x3": 406.322, "r_y3": 660.841, "coord_origin": "TOPLEFT"}, "text": ", pages 142-147. IEEE, 2019. 3", "orig": ", pages 142-147. IEEE, 2019. 3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 272, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 679.983, "r_x1": 323.8, "r_y1": 679.983, "r_x2": 323.8, "r_y2": 672.2860000000001, "r_x3": 308.862, "r_y3": 672.2860000000001, "coord_origin": "TOPLEFT"}, "text": "[25]", "orig": "[25]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 273, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.785, "r_y0": 679.983, "r_x1": 400.857, "r_y1": 679.983, "r_x2": 400.857, "r_y2": 672.2860000000001, "r_x3": 328.785, "r_y3": 672.2860000000001, "coord_origin": "TOPLEFT"}, "text": "Hamid Rezatofighi,", "orig": "Hamid Rezatofighi,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 274, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 405.403, "r_y0": 679.983, "r_x1": 453.571, "r_y1": 679.983, "r_x2": 453.571, "r_y2": 672.2860000000001, "r_x3": 405.403, "r_y3": 672.2860000000001, "coord_origin": "TOPLEFT"}, "text": "Nathan Tsoi,", "orig": "Nathan Tsoi,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 275, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 458.117, "r_y0": 679.983, "r_x1": 521.635, "r_y1": 679.983, "r_x2": 521.635, "r_y2": 672.2860000000001, "r_x3": 458.117, "r_y3": 672.2860000000001, "coord_origin": "TOPLEFT"}, "text": "JunYoung Gwak,", "orig": "JunYoung Gwak,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 276, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 526.181, "r_y0": 679.983, "r_x1": 545.109, "r_y1": 679.983, "r_x2": 545.109, "r_y2": 672.2860000000001, "r_x3": 526.181, "r_y3": 672.2860000000001, "coord_origin": "TOPLEFT"}, "text": "Amir", "orig": "Amir", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 277, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 690.942, "r_x1": 482.815, "r_y1": 690.942, "r_x2": 482.815, "r_y2": 683.245, "r_x3": 328.781, "r_y3": 683.245, "coord_origin": "TOPLEFT"}, "text": "Sadeghian, Ian Reid, and Silvio Savarese.", "orig": "Sadeghian, Ian Reid, and Silvio Savarese.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 278, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 488.751, "r_y0": 690.942, "r_x1": 545.113, "r_y1": 690.942, "r_x2": 545.113, "r_y2": 683.245, "r_x3": 488.751, "r_y3": 683.245, "coord_origin": "TOPLEFT"}, "text": "Generalized in-", "orig": "Generalized in-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 279, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 701.901, "r_x1": 545.113, "r_y1": 701.901, "r_x2": 545.113, "r_y2": 694.204, "r_x3": 328.781, "r_y3": 694.204, "coord_origin": "TOPLEFT"}, "text": "tersection over union: A metric and a loss for bounding box", "orig": "tersection over union: A metric and a loss for bounding box", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 280, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 712.86, "r_x1": 367.74, "r_y1": 712.86, "r_x2": 367.74, "r_y2": 705.163, "r_x3": 328.781, "r_y3": 705.163, "coord_origin": "TOPLEFT"}, "text": "regression.", "orig": "regression.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 281, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 371.685, "r_y0": 712.86, "r_x1": 379.154, "r_y1": 712.86, "r_x2": 379.154, "r_y2": 705.163, "r_x3": 371.685, "r_y3": 705.163, "coord_origin": "TOPLEFT"}, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 282, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 381.616, "r_y0": 712.731, "r_x1": 545.109, "r_y1": 712.731, "r_x2": 545.109, "r_y2": 705.001, "r_x3": 381.616, "r_y3": 705.001, "coord_origin": "TOPLEFT"}, "text": "Proceedings of the IEEE/CVF Conference on", "orig": "Proceedings of the IEEE/CVF Conference on", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 283, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 295.121, "r_y0": 742.954, "r_x1": 300.102, "r_y1": 742.954, "r_x2": 300.102, "r_y2": 734.402, "r_x3": 295.121, "r_y3": 734.402, "coord_origin": "TOPLEFT"}, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "parsed_page": null, "predictions": {"layout": {"clusters": [{"id": 25, "label": "list_item", "bbox": {"l": 70.031, "t": 76.12599999999998, "r": 286.363, "b": 116.69899999999996, "coord_origin": "TOPLEFT"}, "confidence": 0.7310384511947632, "cells": [{"index": 0, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 83.82299999999998, "r_x1": 212.373, "r_y1": 83.82299999999998, "r_x2": 212.373, "r_y2": 76.12599999999998, "r_x3": 70.031, "r_y3": 76.12599999999998, "coord_origin": "TOPLEFT"}, "text": "end object detection with transformers.", "orig": "end object detection with transformers.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 217.313, "r_y0": 83.82299999999998, "r_x1": 286.363, "r_y1": 83.82299999999998, "r_x2": 286.363, "r_y2": 76.12599999999998, "r_x3": 217.313, "r_y3": 76.12599999999998, "coord_origin": "TOPLEFT"}, "text": "In Andrea Vedaldi,", "orig": "In Andrea Vedaldi,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 94.78200000000004, "r_x1": 286.363, "r_y1": 94.78200000000004, "r_x2": 286.363, "r_y2": 87.08500000000004, "r_x3": 70.031, "r_y3": 87.08500000000004, "coord_origin": "TOPLEFT"}, "text": "Horst Bischof, Thomas Brox, and Jan-Michael Frahm, edi-", "orig": "Horst Bischof, Thomas Brox, and Jan-Michael Frahm, edi-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 105.74000000000001, "r_x1": 85.722, "r_y1": 105.74000000000001, "r_x2": 85.722, "r_y2": 98.043, "r_x3": 70.031, "r_y3": 98.043, "coord_origin": "TOPLEFT"}, "text": "tors,", "orig": "tors,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 87.889, "r_y0": 105.61099999999999, "r_x1": 199.933, "r_y1": 105.61099999999999, "r_x2": 199.933, "r_y2": 97.88099999999997, "r_x3": 87.889, "r_y3": 97.88099999999997, "coord_origin": "TOPLEFT"}, "text": "Computer Vision - ECCV 2020", "orig": "Computer Vision - ECCV 2020", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 199.936, "r_y0": 105.74000000000001, "r_x1": 286.363, "r_y1": 105.74000000000001, "r_x2": 286.363, "r_y2": 98.043, "r_x3": 199.936, "r_y3": 98.043, "coord_origin": "TOPLEFT"}, "text": ", pages 213-229, Cham,", "orig": ", pages 213-229, Cham,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 116.69899999999996, "r_x1": 221.949, "r_y1": 116.69899999999996, "r_x2": 221.949, "r_y2": 109.00199999999995, "r_x3": 70.031, "r_y3": 109.00199999999995, "coord_origin": "TOPLEFT"}, "text": "2020. Springer International Publishing. 5", "orig": "2020. Springer International Publishing. 5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 9, "label": "list_item", "bbox": {"l": 54.595, "t": 120.274, "r": 286.363, "b": 149.889, "coord_origin": "TOPLEFT"}, "confidence": 0.9372755885124207, "cells": [{"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 54.595, "r_y0": 127.971, "r_x1": 65.05, "r_y1": 127.971, "r_x2": 65.05, "r_y2": 120.274, "r_x3": 54.595, "r_y3": 120.274, "coord_origin": "TOPLEFT"}, "text": "[2]", "orig": "[2]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 127.971, "r_x1": 286.359, "r_y1": 127.971, "r_x2": 286.359, "r_y2": 120.274, "r_x3": 70.035, "r_y3": 120.274, "coord_origin": "TOPLEFT"}, "text": "Zewen Chi, Heyan Huang, Heng-Da Xu, Houjin Yu, Wanx-", "orig": "Zewen Chi, Heyan Huang, Heng-Da Xu, Houjin Yu, Wanx-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 138.92999999999995, "r_x1": 179.672, "r_y1": 138.92999999999995, "r_x2": 179.672, "r_y2": 131.23299999999995, "r_x3": 70.031, "r_y3": 131.23299999999995, "coord_origin": "TOPLEFT"}, "text": "uan Yin, and Xian-Ling Mao.", "orig": "uan Yin, and Xian-Ling Mao.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 185.581, "r_y0": 138.92999999999995, "r_x1": 286.363, "r_y1": 138.92999999999995, "r_x2": 286.363, "r_y2": 131.23299999999995, "r_x3": 185.581, "r_y3": 131.23299999999995, "coord_origin": "TOPLEFT"}, "text": "Complicated table structure", "orig": "Complicated table structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 149.889, "r_x1": 113.115, "r_y1": 149.889, "r_x2": 113.115, "r_y2": 142.192, "r_x3": 70.031, "r_y3": 142.192, "coord_origin": "TOPLEFT"}, "text": "recognition.", "orig": "recognition.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 116.342, "r_y0": 149.76, "r_x1": 235.308, "r_y1": 149.76, "r_x2": 235.308, "r_y2": 142.02999999999997, "r_x3": 116.342, "r_y3": 142.02999999999997, "coord_origin": "TOPLEFT"}, "text": "arXiv preprint arXiv:1908.04729", "orig": "arXiv preprint arXiv:1908.04729", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 235.307, "r_y0": 149.889, "r_x1": 267.676, "r_y1": 149.889, "r_x2": 267.676, "r_y2": 142.192, "r_x3": 235.307, "r_y3": 142.192, "coord_origin": "TOPLEFT"}, "text": ", 2019. 3", "orig": ", 2019. 3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 7, "label": "list_item", "bbox": {"l": 54.595, "t": 153.30200000000002, "r": 286.363, "b": 183.07799999999997, "coord_origin": "TOPLEFT"}, "confidence": 0.9378374218940735, "cells": [{"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 54.595, "r_y0": 161.16099999999994, "r_x1": 65.05, "r_y1": 161.16099999999994, "r_x2": 65.05, "r_y2": 153.46400000000006, "r_x3": 54.595, "r_y3": 153.46400000000006, "coord_origin": "TOPLEFT"}, "text": "[3]", "orig": "[3]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 161.16099999999994, "r_x1": 218.779, "r_y1": 161.16099999999994, "r_x2": 218.779, "r_y2": 153.46400000000006, "r_x3": 70.035, "r_y3": 153.46400000000006, "coord_origin": "TOPLEFT"}, "text": "Bertrand Couasnon and Aurelie Lemaitre.", "orig": "Bertrand Couasnon and Aurelie Lemaitre.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 220.98, "r_y0": 161.03200000000004, "r_x1": 286.363, "r_y1": 161.03200000000004, "r_x2": 286.363, "r_y2": 153.30200000000002, "r_x3": 220.98, "r_y3": 153.30200000000002, "coord_origin": "TOPLEFT"}, "text": "Recognition of Ta-", "orig": "Recognition of Ta-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 171.99099999999999, "r_x1": 125.264, "r_y1": 171.99099999999999, "r_x2": 125.264, "r_y2": 164.26099999999997, "r_x3": 70.031, "r_y3": 164.26099999999997, "coord_origin": "TOPLEFT"}, "text": "bles and Forms", "orig": "bles and Forms", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 125.261, "r_y0": 172.12, "r_x1": 127.503, "r_y1": 172.12, "r_x2": 127.503, "r_y2": 164.423, "r_x3": 125.261, "r_y3": 164.423, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 19, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 129.986, "r_y0": 172.12, "r_x1": 286.36, "r_y1": 172.12, "r_x2": 286.36, "r_y2": 164.423, "r_x3": 129.986, "r_y3": 164.423, "coord_origin": "TOPLEFT"}, "text": "pages 647-677. Springer London, London,", "orig": "pages 647-677. Springer London, London,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 20, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 183.07799999999997, "r_x1": 97.917, "r_y1": 183.07799999999997, "r_x2": 97.917, "r_y2": 175.38099999999997, "r_x3": 70.031, "r_y3": 175.38099999999997, "coord_origin": "TOPLEFT"}, "text": "2014. 2", "orig": "2014. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 0, "label": "list_item", "bbox": {"l": 54.595, "t": 186.65300000000002, "r": 286.364, "b": 227.22699999999998, "coord_origin": "TOPLEFT"}, "confidence": 0.9648825526237488, "cells": [{"index": 21, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 54.595, "r_y0": 194.35000000000002, "r_x1": 65.05, "r_y1": 194.35000000000002, "r_x2": 65.05, "r_y2": 186.65300000000002, "r_x3": 54.595, "r_y3": 186.65300000000002, "coord_origin": "TOPLEFT"}, "text": "[4]", "orig": "[4]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 22, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 194.35000000000002, "r_x1": 91.936, "r_y1": 194.35000000000002, "r_x2": 91.936, "r_y2": 186.65300000000002, "r_x3": 70.035, "r_y3": 186.65300000000002, "coord_origin": "TOPLEFT"}, "text": "Herv\u00b4 e", "orig": "Herv\u00b4 e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 23, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 97.101, "r_y0": 194.35000000000002, "r_x1": 124.736, "r_y1": 194.35000000000002, "r_x2": 124.736, "r_y2": 186.65300000000002, "r_x3": 97.101, "r_y3": 186.65300000000002, "coord_origin": "TOPLEFT"}, "text": "D\u00b4jean,", "orig": "D\u00b4jean,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 24, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 103.575, "r_y0": 194.35000000000002, "r_x1": 107.556, "r_y1": 194.35000000000002, "r_x2": 107.556, "r_y2": 186.65300000000002, "r_x3": 103.575, "r_y3": 186.65300000000002, "coord_origin": "TOPLEFT"}, "text": "e", "orig": "e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 25, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 130.636, "r_y0": 194.35000000000002, "r_x1": 163.497, "r_y1": 194.35000000000002, "r_x2": 163.497, "r_y2": 186.65300000000002, "r_x3": 130.636, "r_y3": 186.65300000000002, "coord_origin": "TOPLEFT"}, "text": "Jean-Luc", "orig": "Jean-Luc", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 26, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 168.662, "r_y0": 194.35000000000002, "r_x1": 200.923, "r_y1": 194.35000000000002, "r_x2": 200.923, "r_y2": 186.65300000000002, "r_x3": 168.662, "r_y3": 186.65300000000002, "coord_origin": "TOPLEFT"}, "text": "Meunier,", "orig": "Meunier,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 27, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 206.814, "r_y0": 194.35000000000002, "r_x1": 238.188, "r_y1": 194.35000000000002, "r_x2": 238.188, "r_y2": 186.65300000000002, "r_x3": 206.814, "r_y3": 186.65300000000002, "coord_origin": "TOPLEFT"}, "text": "Liangcai", "orig": "Liangcai", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 28, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 243.352, "r_y0": 194.35000000000002, "r_x1": 260.532, "r_y1": 194.35000000000002, "r_x2": 260.532, "r_y2": 186.65300000000002, "r_x3": 243.352, "r_y3": 186.65300000000002, "coord_origin": "TOPLEFT"}, "text": "Gao,", "orig": "Gao,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 29, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 266.432, "r_y0": 194.35000000000002, "r_x1": 286.364, "r_y1": 194.35000000000002, "r_x2": 286.364, "r_y2": 186.65300000000002, "r_x3": 266.432, "r_y3": 186.65300000000002, "coord_origin": "TOPLEFT"}, "text": "Yilun", "orig": "Yilun", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 30, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 205.30899999999997, "r_x1": 269.605, "r_y1": 205.30899999999997, "r_x2": 269.605, "r_y2": 197.61199999999997, "r_x3": 70.031, "r_y3": 197.61199999999997, "coord_origin": "TOPLEFT"}, "text": "Huang, Yu Fang, Florian Kleber, and Eva-Maria Lang.", "orig": "Huang, Yu Fang, Florian Kleber, and Eva-Maria Lang.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 274.411, "r_y0": 205.30899999999997, "r_x1": 286.363, "r_y1": 205.30899999999997, "r_x2": 286.363, "r_y2": 197.61199999999997, "r_x3": 274.411, "r_y3": 197.61199999999997, "coord_origin": "TOPLEFT"}, "text": "IC-", "orig": "IC-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 216.26800000000003, "r_x1": 286.363, "r_y1": 216.26800000000003, "r_x2": 286.363, "r_y2": 208.57100000000003, "r_x3": 70.031, "r_y3": 208.57100000000003, "coord_origin": "TOPLEFT"}, "text": "DAR 2019 Competition on Table Detection and Recognition", "orig": "DAR 2019 Competition on Table Detection and Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 227.22699999999998, "r_x1": 245.835, "r_y1": 227.22699999999998, "r_x2": 245.835, "r_y2": 219.52999999999997, "r_x3": 70.031, "r_y3": 219.52999999999997, "coord_origin": "TOPLEFT"}, "text": "(cTDaR), Apr. 2019. http://sac.founderit.com/. 2", "orig": "(cTDaR), Apr. 2019. http://sac.founderit.com/. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 1, "label": "list_item", "bbox": {"l": 54.595, "t": 230.80200000000002, "r": 286.363, "b": 271.375, "coord_origin": "TOPLEFT"}, "confidence": 0.9620943069458008, "cells": [{"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 54.595, "r_y0": 238.49900000000002, "r_x1": 65.05, "r_y1": 238.49900000000002, "r_x2": 65.05, "r_y2": 230.80200000000002, "r_x3": 54.595, "r_y3": 230.80200000000002, "coord_origin": "TOPLEFT"}, "text": "[5]", "orig": "[5]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 238.49900000000002, "r_x1": 286.359, "r_y1": 238.49900000000002, "r_x2": 286.359, "r_y2": 230.80200000000002, "r_x3": 70.035, "r_y3": 230.80200000000002, "coord_origin": "TOPLEFT"}, "text": "Basilios Gatos, Dimitrios Danatsas, Ioannis Pratikakis, and", "orig": "Basilios Gatos, Dimitrios Danatsas, Ioannis Pratikakis, and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 249.45799999999997, "r_x1": 286.363, "r_y1": 249.45799999999997, "r_x2": 286.363, "r_y2": 241.76099999999997, "r_x3": 70.031, "r_y3": 241.76099999999997, "coord_origin": "TOPLEFT"}, "text": "Stavros J Perantonis. Automatic table detection in document", "orig": "Stavros J Perantonis. Automatic table detection in document", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 260.41600000000005, "r_x1": 108.398, "r_y1": 260.41600000000005, "r_x2": 108.398, "r_y2": 252.71900000000005, "r_x3": 70.031, "r_y3": 252.71900000000005, "coord_origin": "TOPLEFT"}, "text": "images. In", "orig": "images. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 110.645, "r_y0": 260.28700000000003, "r_x1": 286.36, "r_y1": 260.28700000000003, "r_x2": 286.36, "r_y2": 252.55700000000002, "r_x3": 110.645, "r_y3": 252.55700000000002, "coord_origin": "TOPLEFT"}, "text": "International Conference on Pattern Recognition", "orig": "International Conference on Pattern Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 271.246, "r_x1": 140.579, "r_y1": 271.246, "r_x2": 140.579, "r_y2": 263.51599999999996, "r_x3": 70.031, "r_y3": 263.51599999999996, "coord_origin": "TOPLEFT"}, "text": "and Image Analysis", "orig": "and Image Analysis", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 140.578, "r_y0": 271.375, "r_x1": 266.475, "r_y1": 271.375, "r_x2": 266.475, "r_y2": 263.678, "r_x3": 140.578, "r_y3": 263.678, "coord_origin": "TOPLEFT"}, "text": ", pages 609-618. Springer, 2005. 2", "orig": ", pages 609-618. Springer, 2005. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 2, "label": "list_item", "bbox": {"l": 54.595, "t": 274.95000000000005, "r": 286.367, "b": 315.524, "coord_origin": "TOPLEFT"}, "confidence": 0.9555517435073853, "cells": [{"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 54.595, "r_y0": 282.647, "r_x1": 65.05, "r_y1": 282.647, "r_x2": 65.05, "r_y2": 274.95000000000005, "r_x3": 54.595, "r_y3": 274.95000000000005, "coord_origin": "TOPLEFT"}, "text": "[6]", "orig": "[6]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 282.647, "r_x1": 286.367, "r_y1": 282.647, "r_x2": 286.367, "r_y2": 274.95000000000005, "r_x3": 70.035, "r_y3": 274.95000000000005, "coord_origin": "TOPLEFT"}, "text": "MaxG\u00a8bel, Tamir Hassan, Ermelinda Oro, and Giorgio Orsi.", "orig": "MaxG\u00a8bel, Tamir Hassan, Ermelinda Oro, and Giorgio Orsi.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 94.719, "r_y0": 282.647, "r_x1": 99.202, "r_y1": 282.647, "r_x2": 99.202, "r_y2": 274.95000000000005, "r_x3": 94.719, "r_y3": 274.95000000000005, "coord_origin": "TOPLEFT"}, "text": "o", "orig": "o", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 293.606, "r_x1": 179.574, "r_y1": 293.606, "r_x2": 179.574, "r_y2": 285.909, "r_x3": 70.031, "r_y3": 285.909, "coord_origin": "TOPLEFT"}, "text": "Icdar 2013 table competition.", "orig": "Icdar 2013 table competition.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 187.016, "r_y0": 293.606, "r_x1": 194.485, "r_y1": 293.606, "r_x2": 194.485, "r_y2": 285.909, "r_x3": 187.016, "r_y3": 285.909, "coord_origin": "TOPLEFT"}, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 198.044, "r_y0": 293.477, "r_x1": 286.363, "r_y1": 293.477, "r_x2": 286.363, "r_y2": 285.747, "r_x3": 198.044, "r_y3": 285.747, "coord_origin": "TOPLEFT"}, "text": "2013 12th International", "orig": "2013 12th International", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 304.436, "r_x1": 260.199, "r_y1": 304.436, "r_x2": 260.199, "r_y2": 296.706, "r_x3": 70.031, "r_y3": 296.706, "coord_origin": "TOPLEFT"}, "text": "Conference on Document Analysis and Recognition", "orig": "Conference on Document Analysis and Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 48, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 260.198, "r_y0": 304.565, "r_x1": 262.44, "r_y1": 304.565, "r_x2": 262.44, "r_y2": 296.868, "r_x3": 260.198, "r_y3": 296.868, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 49, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 265.945, "r_y0": 304.565, "r_x1": 286.362, "r_y1": 304.565, "r_x2": 286.362, "r_y2": 296.868, "r_x3": 265.945, "r_y3": 296.868, "coord_origin": "TOPLEFT"}, "text": "pages", "orig": "pages", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 50, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 315.524, "r_x1": 142.749, "r_y1": 315.524, "r_x2": 142.749, "r_y2": 307.827, "r_x3": 70.031, "r_y3": 307.827, "coord_origin": "TOPLEFT"}, "text": "1449-1453, 2013. 2", "orig": "1449-1453, 2013. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 4, "label": "list_item", "bbox": {"l": 54.595, "t": 319.099, "r": 286.363, "b": 348.713, "coord_origin": "TOPLEFT"}, "confidence": 0.9479843378067017, "cells": [{"index": 51, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 54.595, "r_y0": 326.796, "r_x1": 65.05, "r_y1": 326.796, "r_x2": 65.05, "r_y2": 319.099, "r_x3": 54.595, "r_y3": 319.099, "coord_origin": "TOPLEFT"}, "text": "[7]", "orig": "[7]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 52, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 326.796, "r_x1": 199.492, "r_y1": 326.796, "r_x2": 199.492, "r_y2": 319.099, "r_x3": 70.035, "r_y3": 319.099, "coord_origin": "TOPLEFT"}, "text": "EA Green and M Krishnamoorthy.", "orig": "EA Green and M Krishnamoorthy.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 53, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 206.988, "r_y0": 326.796, "r_x1": 286.359, "r_y1": 326.796, "r_x2": 286.359, "r_y2": 319.099, "r_x3": 206.988, "r_y3": 319.099, "coord_origin": "TOPLEFT"}, "text": "Recognition of tables", "orig": "Recognition of tables", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 54, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 337.754, "r_x1": 176.283, "r_y1": 337.754, "r_x2": 176.283, "r_y2": 330.057, "r_x3": 70.031, "r_y3": 330.057, "coord_origin": "TOPLEFT"}, "text": "using table grammars. procs.", "orig": "using table grammars. procs.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 55, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 182.604, "r_y0": 337.754, "r_x1": 190.073, "r_y1": 337.754, "r_x2": 190.073, "r_y2": 330.057, "r_x3": 182.604, "r_y3": 330.057, "coord_origin": "TOPLEFT"}, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 56, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 193.283, "r_y0": 337.625, "r_x1": 286.363, "r_y1": 337.625, "r_x2": 286.363, "r_y2": 329.895, "r_x3": 193.283, "r_y3": 329.895, "coord_origin": "TOPLEFT"}, "text": "Symposium on Document", "orig": "Symposium on Document", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 57, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 348.584, "r_x1": 206.347, "r_y1": 348.584, "r_x2": 206.347, "r_y2": 340.854, "r_x3": 70.031, "r_y3": 340.854, "coord_origin": "TOPLEFT"}, "text": "Analysis and Recognition (SDAIR'95)", "orig": "Analysis and Recognition (SDAIR'95)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 58, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 206.346, "r_y0": 348.713, "r_x1": 274.822, "r_y1": 348.713, "r_x2": 274.822, "r_y2": 341.016, "r_x3": 206.346, "r_y3": 341.016, "coord_origin": "TOPLEFT"}, "text": ", pages 261-277. 2", "orig": ", pages 261-277. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 3, "label": "list_item", "bbox": {"l": 54.595, "t": 352.288, "r": 286.363, "b": 403.821, "coord_origin": "TOPLEFT"}, "confidence": 0.9484425187110901, "cells": [{"index": 59, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 54.595, "r_y0": 359.985, "r_x1": 65.05, "r_y1": 359.985, "r_x2": 65.05, "r_y2": 352.288, "r_x3": 54.595, "r_y3": 352.288, "coord_origin": "TOPLEFT"}, "text": "[8]", "orig": "[8]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 60, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 359.985, "r_x1": 286.359, "r_y1": 359.985, "r_x2": 286.359, "r_y2": 352.288, "r_x3": 70.035, "r_y3": 352.288, "coord_origin": "TOPLEFT"}, "text": "Khurram Azeem Hashmi, Alain Pagani, Marcus Liwicki, Di-", "orig": "Khurram Azeem Hashmi, Alain Pagani, Marcus Liwicki, Di-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 61, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 370.944, "r_x1": 234.125, "r_y1": 370.944, "r_x2": 234.125, "r_y2": 363.247, "r_x3": 70.031, "r_y3": 363.247, "coord_origin": "TOPLEFT"}, "text": "dier Stricker, and Muhammad Zeshan Afzal.", "orig": "dier Stricker, and Muhammad Zeshan Afzal.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 62, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 240.052, "r_y0": 370.944, "r_x1": 286.363, "r_y1": 370.944, "r_x2": 286.363, "r_y2": 363.247, "r_x3": 240.052, "r_y3": 363.247, "coord_origin": "TOPLEFT"}, "text": "Castabdetec-", "orig": "Castabdetec-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 63, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 381.903, "r_x1": 85.973, "r_y1": 381.903, "r_x2": 85.973, "r_y2": 374.206, "r_x3": 70.031, "r_y3": 374.206, "coord_origin": "TOPLEFT"}, "text": "tors:", "orig": "tors:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 64, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 90.349, "r_y0": 381.903, "r_x1": 286.363, "r_y1": 381.903, "r_x2": 286.363, "r_y2": 374.206, "r_x3": 90.349, "r_y3": 374.206, "coord_origin": "TOPLEFT"}, "text": "Cascade network for table detection in document im-", "orig": "Cascade network for table detection in document im-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 65, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 392.862, "r_x1": 286.363, "r_y1": 392.862, "r_x2": 286.363, "r_y2": 385.165, "r_x3": 70.031, "r_y3": 385.165, "coord_origin": "TOPLEFT"}, "text": "ages with recursive feature pyramid and switchable atrous", "orig": "ages with recursive feature pyramid and switchable atrous", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 66, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 403.821, "r_x1": 114.576, "r_y1": 403.821, "r_x2": 114.576, "r_y2": 396.124, "r_x3": 70.031, "r_y3": 396.124, "coord_origin": "TOPLEFT"}, "text": "convolution.", "orig": "convolution.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 67, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 117.804, "r_y0": 403.692, "r_x1": 186.729, "r_y1": 403.692, "r_x2": 186.729, "r_y2": 395.962, "r_x3": 117.804, "r_y3": 395.962, "coord_origin": "TOPLEFT"}, "text": "Journal of Imaging", "orig": "Journal of Imaging", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 68, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 186.728, "r_y0": 403.821, "r_x1": 243.001, "r_y1": 403.821, "r_x2": 243.001, "r_y2": 396.124, "r_x3": 186.728, "r_y3": 396.124, "coord_origin": "TOPLEFT"}, "text": ", 7(10), 2021. 1", "orig": ", 7(10), 2021. 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 10, "label": "list_item", "bbox": {"l": 54.595, "t": 407.395, "r": 286.36, "b": 437.01, "coord_origin": "TOPLEFT"}, "confidence": 0.9330756664276123, "cells": [{"index": 69, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 54.595, "r_y0": 415.092, "r_x1": 65.05, "r_y1": 415.092, "r_x2": 65.05, "r_y2": 407.395, "r_x3": 54.595, "r_y3": 407.395, "coord_origin": "TOPLEFT"}, "text": "[9]", "orig": "[9]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 70, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 415.092, "r_x1": 286.359, "r_y1": 415.092, "r_x2": 286.359, "r_y2": 407.395, "r_x3": 70.035, "r_y3": 407.395, "coord_origin": "TOPLEFT"}, "text": "Kaiming He, Georgia Gkioxari, Piotr Dollar, and Ross Gir-", "orig": "Kaiming He, Georgia Gkioxari, Piotr Dollar, and Ross Gir-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 71, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 426.051, "r_x1": 147.133, "r_y1": 426.051, "r_x2": 147.133, "r_y2": 418.354, "r_x3": 70.031, "r_y3": 418.354, "coord_origin": "TOPLEFT"}, "text": "shick. Mask r-cnn. In", "orig": "shick. Mask r-cnn. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 72, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 149.156, "r_y0": 425.922, "r_x1": 286.36, "r_y1": 425.922, "r_x2": 286.36, "r_y2": 418.192, "r_x3": 149.156, "r_y3": 418.192, "coord_origin": "TOPLEFT"}, "text": "Proceedings of the IEEE International", "orig": "Proceedings of the IEEE International", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 73, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 436.881, "r_x1": 213.484, "r_y1": 436.881, "r_x2": 213.484, "r_y2": 429.151, "r_x3": 70.031, "r_y3": 429.151, "coord_origin": "TOPLEFT"}, "text": "Conference on Computer Vision (ICCV)", "orig": "Conference on Computer Vision (ICCV)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 74, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 213.483, "r_y0": 437.01, "r_x1": 261.041, "r_y1": 437.01, "r_x2": 261.041, "r_y2": 429.313, "r_x3": 213.483, "r_y3": 429.313, "coord_origin": "TOPLEFT"}, "text": ", Oct 2017. 1", "orig": ", Oct 2017. 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 14, "label": "list_item", "bbox": {"l": 50.112, "t": 440.585, "r": 286.363, "b": 481.159, "coord_origin": "TOPLEFT"}, "confidence": 0.9274735450744629, "cells": [{"index": 75, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 448.282, "r_x1": 65.05, "r_y1": 448.282, "r_x2": 65.05, "r_y2": 440.585, "r_x3": 50.112, "r_y3": 440.585, "coord_origin": "TOPLEFT"}, "text": "[10]", "orig": "[10]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 76, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 448.282, "r_x1": 286.359, "r_y1": 448.282, "r_x2": 286.359, "r_y2": 440.585, "r_x3": 70.035, "r_y3": 440.585, "coord_origin": "TOPLEFT"}, "text": "Yelin He, X. Qi, Jiaquan Ye, Peng Gao, Yihao Chen, Bing-", "orig": "Yelin He, X. Qi, Jiaquan Ye, Peng Gao, Yihao Chen, Bing-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 77, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 459.241, "r_x1": 202.743, "r_y1": 459.241, "r_x2": 202.743, "r_y2": 451.544, "r_x3": 70.031, "r_y3": 451.544, "coord_origin": "TOPLEFT"}, "text": "cong Li, Xin Tang, and Rong Xiao.", "orig": "cong Li, Xin Tang, and Rong Xiao.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 78, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 209.001, "r_y0": 459.241, "r_x1": 286.363, "r_y1": 459.241, "r_x2": 286.363, "r_y2": 451.544, "r_x3": 209.001, "r_y3": 451.544, "coord_origin": "TOPLEFT"}, "text": "Pingan-vcgroup's so-", "orig": "Pingan-vcgroup's so-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 79, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 470.2, "r_x1": 286.363, "r_y1": 470.2, "r_x2": 286.363, "r_y2": 462.503, "r_x3": 70.031, "r_y3": 462.503, "coord_origin": "TOPLEFT"}, "text": "lution for icdar 2021 competition on scientific table image", "orig": "lution for icdar 2021 competition on scientific table image", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 80, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 481.159, "r_x1": 141.87, "r_y1": 481.159, "r_x2": 141.87, "r_y2": 473.462, "r_x3": 70.031, "r_y3": 473.462, "coord_origin": "TOPLEFT"}, "text": "recognition to latex.", "orig": "recognition to latex.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 81, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 145.097, "r_y0": 481.03, "r_x1": 166.016, "r_y1": 481.03, "r_x2": 166.016, "r_y2": 473.3, "r_x3": 145.097, "r_y3": 473.3, "coord_origin": "TOPLEFT"}, "text": "ArXiv", "orig": "ArXiv", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 82, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 166.015, "r_y0": 481.159, "r_x1": 259.902, "r_y1": 481.159, "r_x2": 259.902, "r_y2": 473.462, "r_x3": 166.015, "r_y3": 473.462, "coord_origin": "TOPLEFT"}, "text": ", abs/2105.01846, 2021. 2", "orig": ", abs/2105.01846, 2021. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 11, "label": "list_item", "bbox": {"l": 50.112, "t": 484.733, "r": 286.363, "b": 536.266, "coord_origin": "TOPLEFT"}, "confidence": 0.9299950003623962, "cells": [{"index": 83, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 492.43, "r_x1": 65.05, "r_y1": 492.43, "r_x2": 65.05, "r_y2": 484.733, "r_x3": 50.112, "r_y3": 484.733, "coord_origin": "TOPLEFT"}, "text": "[11]", "orig": "[11]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 84, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 492.43, "r_x1": 117.091, "r_y1": 492.43, "r_x2": 117.091, "r_y2": 484.733, "r_x3": 70.035, "r_y3": 484.733, "coord_origin": "TOPLEFT"}, "text": "Jianying Hu,", "orig": "Jianying Hu,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 85, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 121.054, "r_y0": 492.43, "r_x1": 286.359, "r_y1": 492.43, "r_x2": 286.359, "r_y2": 484.733, "r_x3": 121.054, "r_y3": 484.733, "coord_origin": "TOPLEFT"}, "text": "Ramanujan S Kashi, Daniel P Lopresti, and", "orig": "Ramanujan S Kashi, Daniel P Lopresti, and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 86, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 503.389, "r_x1": 132.15, "r_y1": 503.389, "r_x2": 132.15, "r_y2": 495.692, "r_x3": 70.031, "r_y3": 495.692, "coord_origin": "TOPLEFT"}, "text": "Gordon Wilfong.", "orig": "Gordon Wilfong.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 87, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 137.691, "r_y0": 503.389, "r_x1": 273.362, "r_y1": 503.389, "r_x2": 273.362, "r_y2": 495.692, "r_x3": 137.691, "r_y3": 495.692, "coord_origin": "TOPLEFT"}, "text": "Medium-independent table detection.", "orig": "Medium-independent table detection.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 88, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 278.894, "r_y0": 503.389, "r_x1": 286.363, "r_y1": 503.389, "r_x2": 286.363, "r_y2": 495.692, "r_x3": 278.894, "r_y3": 495.692, "coord_origin": "TOPLEFT"}, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 89, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 514.219, "r_x1": 106.883, "r_y1": 514.219, "r_x2": 106.883, "r_y2": 506.489, "r_x3": 70.031, "r_y3": 506.489, "coord_origin": "TOPLEFT"}, "text": "Document", "orig": "Document", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 90, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 111.796, "r_y0": 514.219, "r_x1": 155.041, "r_y1": 514.219, "r_x2": 155.041, "r_y2": 506.489, "r_x3": 111.796, "r_y3": 506.489, "coord_origin": "TOPLEFT"}, "text": "Recognition", "orig": "Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 91, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 159.946, "r_y0": 514.219, "r_x1": 173.396, "r_y1": 514.219, "r_x2": 173.396, "r_y2": 506.489, "r_x3": 159.946, "r_y3": 506.489, "coord_origin": "TOPLEFT"}, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 92, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 178.309, "r_y0": 514.219, "r_x1": 211.046, "r_y1": 514.219, "r_x2": 211.046, "r_y2": 506.489, "r_x3": 178.309, "r_y3": 506.489, "coord_origin": "TOPLEFT"}, "text": "Retrieval", "orig": "Retrieval", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 93, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 215.959, "r_y0": 514.219, "r_x1": 227.409, "r_y1": 514.219, "r_x2": 227.409, "r_y2": 506.489, "r_x3": 215.959, "r_y3": 506.489, "coord_origin": "TOPLEFT"}, "text": "VII", "orig": "VII", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 94, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 227.405, "r_y0": 514.348, "r_x1": 229.647, "r_y1": 514.348, "r_x2": 229.647, "r_y2": 506.651, "r_x3": 227.405, "r_y3": 506.651, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 95, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 234.56, "r_y0": 514.348, "r_x1": 261.28, "r_y1": 514.348, "r_x2": 261.28, "r_y2": 506.651, "r_x3": 234.56, "r_y3": 506.651, "coord_origin": "TOPLEFT"}, "text": "volume", "orig": "volume", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 96, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 266.185, "r_y0": 514.348, "r_x1": 286.359, "r_y1": 514.348, "r_x2": 286.359, "r_y2": 506.651, "r_x3": 266.185, "r_y3": 506.651, "coord_origin": "TOPLEFT"}, "text": "3967,", "orig": "3967,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 97, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 525.307, "r_x1": 286.363, "r_y1": 525.307, "r_x2": 286.363, "r_y2": 517.61, "r_x3": 70.031, "r_y3": 517.61, "coord_origin": "TOPLEFT"}, "text": "pages 291-302. International Society for Optics and Photon-", "orig": "pages 291-302. International Society for Optics and Photon-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 98, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 536.266, "r_x1": 112.361, "r_y1": 536.266, "r_x2": 112.361, "r_y2": 528.569, "r_x3": 70.031, "r_y3": 528.569, "coord_origin": "TOPLEFT"}, "text": "ics, 1999. 2", "orig": "ics, 1999. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 5, "label": "list_item", "bbox": {"l": 50.112, "t": 539.841, "r": 286.363, "b": 591.373, "coord_origin": "TOPLEFT"}, "confidence": 0.9394103288650513, "cells": [{"index": 99, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 547.538, "r_x1": 65.05, "r_y1": 547.538, "r_x2": 65.05, "r_y2": 539.841, "r_x3": 50.112, "r_y3": 539.841, "coord_origin": "TOPLEFT"}, "text": "[12]", "orig": "[12]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 100, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 547.538, "r_x1": 126.407, "r_y1": 547.538, "r_x2": 126.407, "r_y2": 539.841, "r_x3": 70.035, "r_y3": 539.841, "coord_origin": "TOPLEFT"}, "text": "Matthew Hurst.", "orig": "Matthew Hurst.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 101, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 130.648, "r_y0": 547.538, "r_x1": 286.359, "r_y1": 547.538, "r_x2": 286.359, "r_y2": 539.841, "r_x3": 130.648, "r_y3": 539.841, "coord_origin": "TOPLEFT"}, "text": "A constraint-based approach to table struc-", "orig": "A constraint-based approach to table struc-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 102, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 558.4970000000001, "r_x1": 124.654, "r_y1": 558.4970000000001, "r_x2": 124.654, "r_y2": 550.8, "r_x3": 70.031, "r_y3": 550.8, "coord_origin": "TOPLEFT"}, "text": "ture derivation.", "orig": "ture derivation.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 103, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 128.815, "r_y0": 558.4970000000001, "r_x1": 136.284, "r_y1": 558.4970000000001, "r_x2": 136.284, "r_y2": 550.8, "r_x3": 128.815, "r_y3": 550.8, "coord_origin": "TOPLEFT"}, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 104, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 138.811, "r_y0": 558.3679999999999, "r_x1": 286.362, "r_y1": 558.3679999999999, "r_x2": 286.362, "r_y2": 550.638, "r_x3": 138.811, "r_y3": 550.638, "coord_origin": "TOPLEFT"}, "text": "Proceedings of the Seventh International", "orig": "Proceedings of the Seventh International", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 105, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 569.327, "r_x1": 286.363, "r_y1": 569.327, "r_x2": 286.363, "r_y2": 561.597, "r_x3": 70.031, "r_y3": 561.597, "coord_origin": "TOPLEFT"}, "text": "Conference on Document Analysis and Recognition - Volume", "orig": "Conference on Document Analysis and Recognition - Volume", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 106, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 580.2860000000001, "r_x1": 74.514, "r_y1": 580.2860000000001, "r_x2": 74.514, "r_y2": 572.556, "r_x3": 70.031, "r_y3": 572.556, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 107, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 74.514, "r_y0": 580.415, "r_x1": 76.756, "r_y1": 580.415, "r_x2": 76.756, "r_y2": 572.718, "r_x3": 74.514, "r_y3": 572.718, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 108, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 79.06, "r_y0": 580.415, "r_x1": 286.363, "r_y1": 580.415, "r_x2": 286.363, "r_y2": 572.718, "r_x3": 79.06, "r_y3": 572.718, "coord_origin": "TOPLEFT"}, "text": "ICDAR '03, page 911, USA, 2003. IEEE Computer Soci-", "orig": "ICDAR '03, page 911, USA, 2003. IEEE Computer Soci-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 109, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 591.373, "r_x1": 82.647, "r_y1": 591.373, "r_x2": 82.647, "r_y2": 583.6759999999999, "r_x3": 70.031, "r_y3": 583.6759999999999, "coord_origin": "TOPLEFT"}, "text": "ety.", "orig": "ety.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 110, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 85.875, "r_y0": 591.373, "r_x1": 90.358, "r_y1": 591.373, "r_x2": 90.358, "r_y2": 583.6759999999999, "r_x3": 85.875, "r_y3": 583.6759999999999, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 13, "label": "list_item", "bbox": {"l": 50.112, "t": 594.948, "r": 286.363, "b": 646.481, "coord_origin": "TOPLEFT"}, "confidence": 0.9298838973045349, "cells": [{"index": 111, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 602.645, "r_x1": 65.05, "r_y1": 602.645, "r_x2": 65.05, "r_y2": 594.948, "r_x3": 50.112, "r_y3": 594.948, "coord_origin": "TOPLEFT"}, "text": "[13]", "orig": "[13]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 112, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 602.645, "r_x1": 116.302, "r_y1": 602.645, "r_x2": 116.302, "r_y2": 594.948, "r_x3": 70.035, "r_y3": 594.948, "coord_origin": "TOPLEFT"}, "text": "Thotreingam", "orig": "Thotreingam", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 113, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 121.368, "r_y0": 602.645, "r_x1": 144.161, "r_y1": 602.645, "r_x2": 144.161, "r_y2": 594.948, "r_x3": 121.368, "r_y3": 594.948, "coord_origin": "TOPLEFT"}, "text": "Kasar,", "orig": "Kasar,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 114, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 149.926, "r_y0": 602.645, "r_x1": 186.796, "r_y1": 602.645, "r_x2": 186.796, "r_y2": 594.948, "r_x3": 149.926, "r_y3": 594.948, "coord_origin": "TOPLEFT"}, "text": "Philippine", "orig": "Philippine", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 115, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 191.862, "r_y0": 602.645, "r_x1": 217.013, "r_y1": 602.645, "r_x2": 217.013, "r_y2": 594.948, "r_x3": 191.862, "r_y3": 594.948, "coord_origin": "TOPLEFT"}, "text": "Barlas,", "orig": "Barlas,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 116, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 222.778, "r_y0": 602.645, "r_x1": 257.146, "r_y1": 602.645, "r_x2": 257.146, "r_y2": 594.948, "r_x3": 222.778, "r_y3": 594.948, "coord_origin": "TOPLEFT"}, "text": "Sebastien", "orig": "Sebastien", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 117, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 262.203, "r_y0": 602.645, "r_x1": 286.359, "r_y1": 602.645, "r_x2": 286.359, "r_y2": 594.948, "r_x3": 262.203, "r_y3": 594.948, "coord_origin": "TOPLEFT"}, "text": "Adam,", "orig": "Adam,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 118, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 613.604, "r_x1": 214.838, "r_y1": 613.604, "r_x2": 214.838, "r_y2": 605.907, "r_x3": 70.031, "r_y3": 605.907, "coord_origin": "TOPLEFT"}, "text": "Cl\u00b4ment Chatelain, and Thierry Paquet.", "orig": "Cl\u00b4ment Chatelain, and Thierry Paquet.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 119, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 78.504, "r_y0": 613.604, "r_x1": 82.485, "r_y1": 613.604, "r_x2": 82.485, "r_y2": 605.907, "r_x3": 78.504, "r_y3": 605.907, "coord_origin": "TOPLEFT"}, "text": "e", "orig": "e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 120, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 219.949, "r_y0": 613.604, "r_x1": 286.363, "r_y1": 613.604, "r_x2": 286.363, "r_y2": 605.907, "r_x3": 219.949, "r_y3": 605.907, "coord_origin": "TOPLEFT"}, "text": "Learning to detect", "orig": "Learning to detect", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 121, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 624.563, "r_x1": 286.363, "r_y1": 624.563, "r_x2": 286.363, "r_y2": 616.866, "r_x3": 70.031, "r_y3": 616.866, "coord_origin": "TOPLEFT"}, "text": "tables in scanned document images using line information.", "orig": "tables in scanned document images using line information.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 122, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 635.5219999999999, "r_x1": 77.5, "r_y1": 635.5219999999999, "r_x2": 77.5, "r_y2": 627.825, "r_x3": 70.031, "r_y3": 627.825, "coord_origin": "TOPLEFT"}, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 123, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 79.92, "r_y0": 635.393, "r_x1": 286.362, "r_y1": 635.393, "r_x2": 286.362, "r_y2": 627.663, "r_x3": 79.92, "r_y3": 627.663, "coord_origin": "TOPLEFT"}, "text": "2013 12th International Conference on Document Analy-", "orig": "2013 12th International Conference on Document Analy-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 124, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 646.352, "r_x1": 140.677, "r_y1": 646.352, "r_x2": 140.677, "r_y2": 638.6220000000001, "r_x3": 70.031, "r_y3": 638.6220000000001, "coord_origin": "TOPLEFT"}, "text": "sis and Recognition", "orig": "sis and Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 125, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 140.676, "r_y0": 646.481, "r_x1": 264.439, "r_y1": 646.481, "r_x2": 264.439, "r_y2": 638.784, "r_x3": 140.676, "r_y3": 638.784, "coord_origin": "TOPLEFT"}, "text": ", pages 1185-1189. IEEE, 2013. 2", "orig": ", pages 1185-1189. IEEE, 2013. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 17, "label": "list_item", "bbox": {"l": 50.112, "t": 650.056, "r": 286.363, "b": 679.67, "coord_origin": "TOPLEFT"}, "confidence": 0.9115257263183594, "cells": [{"index": 126, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 657.7529999999999, "r_x1": 65.05, "r_y1": 657.7529999999999, "r_x2": 65.05, "r_y2": 650.056, "r_x3": 50.112, "r_y3": 650.056, "coord_origin": "TOPLEFT"}, "text": "[14]", "orig": "[14]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 127, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 657.7529999999999, "r_x1": 91.447, "r_y1": 657.7529999999999, "r_x2": 91.447, "r_y2": 650.056, "r_x3": 70.035, "r_y3": 650.056, "coord_origin": "TOPLEFT"}, "text": "Pratik", "orig": "Pratik", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 128, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 96.092, "r_y0": 657.7529999999999, "r_x1": 119.745, "r_y1": 657.7529999999999, "r_x2": 119.745, "r_y2": 650.056, "r_x3": 96.092, "r_y3": 650.056, "coord_origin": "TOPLEFT"}, "text": "Kayal,", "orig": "Kayal,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 129, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 124.99, "r_y0": 657.7529999999999, "r_x1": 149.397, "r_y1": 657.7529999999999, "r_x2": 149.397, "r_y2": 650.056, "r_x3": 124.99, "r_y3": 650.056, "coord_origin": "TOPLEFT"}, "text": "Mrinal", "orig": "Mrinal", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 130, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 154.042, "r_y0": 657.7529999999999, "r_x1": 180.188, "r_y1": 657.7529999999999, "r_x2": 180.188, "r_y2": 650.056, "r_x3": 154.042, "r_y3": 650.056, "coord_origin": "TOPLEFT"}, "text": "Anand,", "orig": "Anand,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 131, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 185.433, "r_y0": 657.7529999999999, "r_x1": 206.845, "r_y1": 657.7529999999999, "r_x2": 206.845, "r_y2": 650.056, "r_x3": 185.433, "r_y3": 650.056, "coord_origin": "TOPLEFT"}, "text": "Harsh", "orig": "Harsh", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 132, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 211.489, "r_y0": 657.7529999999999, "r_x1": 234.147, "r_y1": 657.7529999999999, "r_x2": 234.147, "r_y2": 650.056, "r_x3": 211.489, "r_y3": 650.056, "coord_origin": "TOPLEFT"}, "text": "Desai,", "orig": "Desai,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 133, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 239.393, "r_y0": 657.7529999999999, "r_x1": 252.34, "r_y1": 657.7529999999999, "r_x2": 252.34, "r_y2": 650.056, "r_x3": 239.393, "r_y3": 650.056, "coord_origin": "TOPLEFT"}, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 134, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 256.976, "r_y0": 657.7529999999999, "r_x1": 286.359, "r_y1": 657.7529999999999, "r_x2": 286.359, "r_y2": 650.056, "r_x3": 256.976, "r_y3": 650.056, "coord_origin": "TOPLEFT"}, "text": "Mayank", "orig": "Mayank", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 135, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 668.711, "r_x1": 93.2, "r_y1": 668.711, "r_x2": 93.2, "r_y2": 661.014, "r_x3": 70.031, "r_y3": 661.014, "coord_origin": "TOPLEFT"}, "text": "Singh.", "orig": "Singh.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 136, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 102.202, "r_y0": 668.711, "r_x1": 120.619, "r_y1": 668.711, "r_x2": 120.619, "r_y2": 661.014, "r_x3": 102.202, "r_y3": 661.014, "coord_origin": "TOPLEFT"}, "text": "Icdar", "orig": "Icdar", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 137, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 124.672, "r_y0": 668.711, "r_x1": 238.922, "r_y1": 668.711, "r_x2": 238.922, "r_y2": 661.014, "r_x3": 124.672, "r_y3": 661.014, "coord_origin": "TOPLEFT"}, "text": "2021 competition on scientific", "orig": "2021 competition on scientific", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 138, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 242.975, "r_y0": 668.711, "r_x1": 260.406, "r_y1": 668.711, "r_x2": 260.406, "r_y2": 661.014, "r_x3": 242.975, "r_y3": 661.014, "coord_origin": "TOPLEFT"}, "text": "table", "orig": "table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 139, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 264.449, "r_y0": 668.711, "r_x1": 286.363, "r_y1": 668.711, "r_x2": 286.363, "r_y2": 661.014, "r_x3": 264.449, "r_y3": 661.014, "coord_origin": "TOPLEFT"}, "text": "image", "orig": "image", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 140, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 679.67, "r_x1": 171.997, "r_y1": 679.67, "r_x2": 171.997, "r_y2": 671.973, "r_x3": 70.031, "r_y3": 671.973, "coord_origin": "TOPLEFT"}, "text": "recognition to latex, 2021. 2", "orig": "recognition to latex, 2021. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 16, "label": "list_item", "bbox": {"l": 50.112, "t": 683.245, "r": 286.359, "b": 712.86, "coord_origin": "TOPLEFT"}, "confidence": 0.912230372428894, "cells": [{"index": 141, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 690.942, "r_x1": 65.05, "r_y1": 690.942, "r_x2": 65.05, "r_y2": 683.245, "r_x3": 50.112, "r_y3": 683.245, "coord_origin": "TOPLEFT"}, "text": "[15]", "orig": "[15]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 142, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 690.942, "r_x1": 286.359, "r_y1": 690.942, "r_x2": 286.359, "r_y2": 683.245, "r_x3": 70.035, "r_y3": 683.245, "coord_origin": "TOPLEFT"}, "text": "Harold WKuhn. The hungarian method for the assignment", "orig": "Harold WKuhn. The hungarian method for the assignment", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 143, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 701.901, "r_x1": 102.158, "r_y1": 701.901, "r_x2": 102.158, "r_y2": 694.204, "r_x3": 70.031, "r_y3": 694.204, "coord_origin": "TOPLEFT"}, "text": "problem.", "orig": "problem.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 144, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 107.55, "r_y0": 701.772, "r_x1": 231.475, "r_y1": 701.772, "r_x2": 231.475, "r_y2": 694.042, "r_x3": 107.55, "r_y3": 694.042, "coord_origin": "TOPLEFT"}, "text": "Naval research logistics quarterly", "orig": "Naval research logistics quarterly", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 145, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 231.476, "r_y0": 701.901, "r_x1": 233.718, "r_y1": 701.901, "r_x2": 233.718, "r_y2": 694.204, "r_x3": 231.476, "r_y3": 694.204, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 146, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 236.802, "r_y0": 701.901, "r_x1": 286.359, "r_y1": 701.901, "r_x2": 286.359, "r_y2": 694.204, "r_x3": 236.802, "r_y3": 694.204, "coord_origin": "TOPLEFT"}, "text": "2(1-2):83-97,", "orig": "2(1-2):83-97,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 147, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 712.86, "r_x1": 97.917, "r_y1": 712.86, "r_x2": 97.917, "r_y2": 705.163, "r_x3": 70.031, "r_y3": 705.163, "coord_origin": "TOPLEFT"}, "text": "1955. 6", "orig": "1955. 6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 6, "label": "list_item", "bbox": {"l": 308.862, "t": 76.12599999999998, "r": 545.115, "b": 138.61699999999996, "coord_origin": "TOPLEFT"}, "confidence": 0.9389600157737732, "cells": [{"index": 148, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 83.82299999999998, "r_x1": 323.8, "r_y1": 83.82299999999998, "r_x2": 323.8, "r_y2": 76.12599999999998, "r_x3": 308.862, "r_y3": 76.12599999999998, "coord_origin": "TOPLEFT"}, "text": "[16]", "orig": "[16]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 149, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.785, "r_y0": 83.82299999999998, "r_x1": 351.192, "r_y1": 83.82299999999998, "r_x2": 351.192, "r_y2": 76.12599999999998, "r_x3": 328.785, "r_y3": 76.12599999999998, "coord_origin": "TOPLEFT"}, "text": "Girish", "orig": "Girish", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 150, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 355.308, "r_y0": 83.82299999999998, "r_x1": 389.291, "r_y1": 83.82299999999998, "r_x2": 389.291, "r_y2": 76.12599999999998, "r_x3": 355.308, "r_y3": 76.12599999999998, "coord_origin": "TOPLEFT"}, "text": "Kulkarni,", "orig": "Kulkarni,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 151, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 393.863, "r_y0": 83.82299999999998, "r_x1": 420.225, "r_y1": 83.82299999999998, "r_x2": 420.225, "r_y2": 76.12599999999998, "r_x3": 393.863, "r_y3": 76.12599999999998, "coord_origin": "TOPLEFT"}, "text": "Visruth", "orig": "Visruth", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 152, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 424.331, "r_y0": 83.82299999999998, "r_x1": 454.961, "r_y1": 83.82299999999998, "r_x2": 454.961, "r_y2": 76.12599999999998, "r_x3": 424.331, "r_y3": 76.12599999999998, "coord_origin": "TOPLEFT"}, "text": "Premraj,", "orig": "Premraj,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 153, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 459.533, "r_y0": 83.82299999999998, "r_x1": 486.881, "r_y1": 83.82299999999998, "r_x2": 486.881, "r_y2": 76.12599999999998, "r_x3": 459.533, "r_y3": 76.12599999999998, "coord_origin": "TOPLEFT"}, "text": "Vicente", "orig": "Vicente", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 154, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 490.988, "r_y0": 83.82299999999998, "r_x1": 524.1, "r_y1": 83.82299999999998, "r_x2": 524.1, "r_y2": 76.12599999999998, "r_x3": 490.988, "r_y3": 76.12599999999998, "coord_origin": "TOPLEFT"}, "text": "Ordonez,", "orig": "Ordonez,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 155, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 528.673, "r_y0": 83.82299999999998, "r_x1": 545.109, "r_y1": 83.82299999999998, "r_x2": 545.109, "r_y2": 76.12599999999998, "r_x3": 528.673, "r_y3": 76.12599999999998, "coord_origin": "TOPLEFT"}, "text": "Sag-", "orig": "Sag-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 156, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 94.78099999999995, "r_x1": 545.113, "r_y1": 94.78099999999995, "r_x2": 545.113, "r_y2": 87.08399999999995, "r_x3": 328.781, "r_y3": 87.08399999999995, "coord_origin": "TOPLEFT"}, "text": "nik Dhar, Siming Li, Yejin Choi, Alexander C. Berg, and", "orig": "nik Dhar, Siming Li, Yejin Choi, Alexander C. Berg, and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 157, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 105.74000000000001, "r_x1": 390.963, "r_y1": 105.74000000000001, "r_x2": 390.963, "r_y2": 98.043, "r_x3": 328.781, "r_y3": 98.043, "coord_origin": "TOPLEFT"}, "text": "Tamara L. Berg.", "orig": "Tamara L. Berg.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 158, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 400.27, "r_y0": 105.74000000000001, "r_x1": 435.14, "r_y1": 105.74000000000001, "r_x2": 435.14, "r_y2": 98.043, "r_x3": 400.27, "r_y3": 98.043, "coord_origin": "TOPLEFT"}, "text": "Babytalk:", "orig": "Babytalk:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 159, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 441.713, "r_y0": 105.74000000000001, "r_x1": 494.507, "r_y1": 105.74000000000001, "r_x2": 494.507, "r_y2": 98.043, "r_x3": 441.713, "r_y3": 98.043, "coord_origin": "TOPLEFT"}, "text": "Understanding", "orig": "Understanding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 160, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 498.649, "r_y0": 105.74000000000001, "r_x1": 545.113, "r_y1": 105.74000000000001, "r_x2": 545.113, "r_y2": 98.043, "r_x3": 498.649, "r_y3": 98.043, "coord_origin": "TOPLEFT"}, "text": "and generat-", "orig": "and generat-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 161, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 116.69899999999996, "r_x1": 440.807, "r_y1": 116.69899999999996, "r_x2": 440.807, "r_y2": 109.00199999999995, "r_x3": 328.781, "r_y3": 109.00199999999995, "coord_origin": "TOPLEFT"}, "text": "ing simple image descriptions.", "orig": "ing simple image descriptions.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 162, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 446.635, "r_y0": 116.57000000000005, "r_x1": 545.113, "r_y1": 116.57000000000005, "r_x2": 545.113, "r_y2": 108.84000000000003, "r_x3": 446.635, "r_y3": 108.84000000000003, "coord_origin": "TOPLEFT"}, "text": "IEEE Transactions on Pat-", "orig": "IEEE Transactions on Pat-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 163, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 127.529, "r_x1": 471.132, "r_y1": 127.529, "r_x2": 471.132, "r_y2": 119.79899999999998, "r_x3": 328.781, "r_y3": 119.79899999999998, "coord_origin": "TOPLEFT"}, "text": "tern Analysis and Machine Intelligence", "orig": "tern Analysis and Machine Intelligence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 164, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 471.133, "r_y0": 127.65800000000002, "r_x1": 473.375, "r_y1": 127.65800000000002, "r_x2": 473.375, "r_y2": 119.96100000000001, "r_x3": 471.133, "r_y3": 119.96100000000001, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 165, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 476.127, "r_y0": 127.65800000000002, "r_x1": 545.115, "r_y1": 127.65800000000002, "r_x2": 545.115, "r_y2": 119.96100000000001, "r_x3": 476.127, "r_y3": 119.96100000000001, "coord_origin": "TOPLEFT"}, "text": "35(12):2891-2903,", "orig": "35(12):2891-2903,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 166, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 138.61699999999996, "r_x1": 356.667, "r_y1": 138.61699999999996, "r_x2": 356.667, "r_y2": 130.91999999999996, "r_x3": 328.781, "r_y3": 130.91999999999996, "coord_origin": "TOPLEFT"}, "text": "2013. 4", "orig": "2013. 4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 15, "label": "list_item", "bbox": {"l": 308.862, "t": 142.36599999999999, "r": 545.113, "b": 171.98000000000002, "coord_origin": "TOPLEFT"}, "confidence": 0.9253129959106445, "cells": [{"index": 167, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 150.063, "r_x1": 323.8, "r_y1": 150.063, "r_x2": 323.8, "r_y2": 142.36599999999999, "r_x3": 308.862, "r_y3": 142.36599999999999, "coord_origin": "TOPLEFT"}, "text": "[17]", "orig": "[17]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 168, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.785, "r_y0": 150.063, "r_x1": 375.698, "r_y1": 150.063, "r_x2": 375.698, "r_y2": 142.36599999999999, "r_x3": 328.785, "r_y3": 142.36599999999999, "coord_origin": "TOPLEFT"}, "text": "Minghao Li,", "orig": "Minghao Li,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 169, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 380.557, "r_y0": 150.063, "r_x1": 392.51, "r_y1": 150.063, "r_x2": 392.51, "r_y2": 142.36599999999999, "r_x3": 380.557, "r_y3": 142.36599999999999, "coord_origin": "TOPLEFT"}, "text": "Lei", "orig": "Lei", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 170, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 396.84, "r_y0": 150.063, "r_x1": 412.038, "r_y1": 150.063, "r_x2": 412.038, "r_y2": 142.36599999999999, "r_x3": 396.84, "r_y3": 142.36599999999999, "coord_origin": "TOPLEFT"}, "text": "Cui,", "orig": "Cui,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 171, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 416.889, "r_y0": 150.063, "r_x1": 478.246, "r_y1": 150.063, "r_x2": 478.246, "r_y2": 142.36599999999999, "r_x3": 416.889, "r_y3": 142.36599999999999, "coord_origin": "TOPLEFT"}, "text": "Shaohan Huang,", "orig": "Shaohan Huang,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 172, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 483.097, "r_y0": 150.063, "r_x1": 500.035, "r_y1": 150.063, "r_x2": 500.035, "r_y2": 142.36599999999999, "r_x3": 483.097, "r_y3": 142.36599999999999, "coord_origin": "TOPLEFT"}, "text": "Furu", "orig": "Furu", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 173, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 504.365, "r_y0": 150.063, "r_x1": 520.828, "r_y1": 150.063, "r_x2": 520.828, "r_y2": 142.36599999999999, "r_x3": 504.365, "r_y3": 142.36599999999999, "coord_origin": "TOPLEFT"}, "text": "Wei,", "orig": "Wei,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 174, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 525.679, "r_y0": 150.063, "r_x1": 545.109, "r_y1": 150.063, "r_x2": 545.109, "r_y2": 142.36599999999999, "r_x3": 525.679, "r_y3": 142.36599999999999, "coord_origin": "TOPLEFT"}, "text": "Ming", "orig": "Ming", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 175, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 161.02099999999996, "r_x1": 414.446, "r_y1": 161.02099999999996, "r_x2": 414.446, "r_y2": 153.32399999999996, "r_x3": 328.781, "r_y3": 153.32399999999996, "coord_origin": "TOPLEFT"}, "text": "Zhou, and Zhoujun Li.", "orig": "Zhou, and Zhoujun Li.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 176, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 421.825, "r_y0": 161.02099999999996, "r_x1": 461.448, "r_y1": 161.02099999999996, "r_x2": 461.448, "r_y2": 153.32399999999996, "r_x3": 421.825, "r_y3": 153.32399999999996, "coord_origin": "TOPLEFT"}, "text": "Tablebank:", "orig": "Tablebank:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 177, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 466.828, "r_y0": 161.02099999999996, "r_x1": 545.113, "r_y1": 161.02099999999996, "r_x2": 545.113, "r_y2": 153.32399999999996, "r_x3": 466.828, "r_y3": 153.32399999999996, "coord_origin": "TOPLEFT"}, "text": "A benchmark dataset", "orig": "A benchmark dataset", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 178, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 171.98000000000002, "r_x1": 493.628, "r_y1": 171.98000000000002, "r_x2": 493.628, "r_y2": 164.28300000000002, "r_x3": 328.781, "r_y3": 164.28300000000002, "coord_origin": "TOPLEFT"}, "text": "for table detection and recognition, 2019. 2, 3", "orig": "for table detection and recognition, 2019. 2, 3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 12, "label": "list_item", "bbox": {"l": 308.862, "t": 175.72900000000004, "r": 545.113, "b": 260.13800000000003, "coord_origin": "TOPLEFT"}, "confidence": 0.9299732446670532, "cells": [{"index": 179, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 183.42600000000004, "r_x1": 323.8, "r_y1": 183.42600000000004, "r_x2": 323.8, "r_y2": 175.72900000000004, "r_x3": 308.862, "r_y3": 175.72900000000004, "coord_origin": "TOPLEFT"}, "text": "[18]", "orig": "[18]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 180, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.785, "r_y0": 183.42600000000004, "r_x1": 545.109, "r_y1": 183.42600000000004, "r_x2": 545.109, "r_y2": 175.72900000000004, "r_x3": 328.785, "r_y3": 175.72900000000004, "coord_origin": "TOPLEFT"}, "text": "Yiren Li, Zheng Huang, Junchi Yan, Yi Zhou, Fan Ye, and", "orig": "Yiren Li, Zheng Huang, Junchi Yan, Yi Zhou, Fan Ye, and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 181, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 194.385, "r_x1": 375.397, "r_y1": 194.385, "r_x2": 375.397, "r_y2": 186.688, "r_x3": 328.781, "r_y3": 186.688, "coord_origin": "TOPLEFT"}, "text": "Xianhui Liu.", "orig": "Xianhui Liu.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 182, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 381.154, "r_y0": 194.385, "r_x1": 399.58, "r_y1": 194.385, "r_x2": 399.58, "r_y2": 186.688, "r_x3": 381.154, "r_y3": 186.688, "coord_origin": "TOPLEFT"}, "text": "Gfte:", "orig": "Gfte:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 183, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 403.937, "r_y0": 194.385, "r_x1": 545.113, "r_y1": 194.385, "r_x2": 545.113, "r_y2": 186.688, "r_x3": 403.937, "r_y3": 186.688, "coord_origin": "TOPLEFT"}, "text": "Graph-based financial table extraction.", "orig": "Graph-based financial table extraction.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 184, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 205.34400000000005, "r_x1": 545.113, "r_y1": 205.34400000000005, "r_x2": 545.113, "r_y2": 197.64700000000005, "r_x3": 328.781, "r_y3": 197.64700000000005, "coord_origin": "TOPLEFT"}, "text": "In Alberto Del Bimbo, Rita Cucchiara, Stan Sclaroff, Gio-", "orig": "In Alberto Del Bimbo, Rita Cucchiara, Stan Sclaroff, Gio-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 185, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 216.303, "r_x1": 545.113, "r_y1": 216.303, "r_x2": 545.113, "r_y2": 208.606, "r_x3": 328.781, "r_y3": 208.606, "coord_origin": "TOPLEFT"}, "text": "vanni Maria Farinella, Tao Mei, Marco Bertini, Hugo Jair", "orig": "vanni Maria Farinella, Tao Mei, Marco Bertini, Hugo Jair", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 186, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 227.26199999999994, "r_x1": 365.382, "r_y1": 227.26199999999994, "r_x2": 365.382, "r_y2": 219.56500000000005, "r_x3": 328.781, "r_y3": 219.56500000000005, "coord_origin": "TOPLEFT"}, "text": "Escalante,", "orig": "Escalante,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 187, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 369.237, "r_y0": 227.26199999999994, "r_x1": 479.264, "r_y1": 227.26199999999994, "r_x2": 479.264, "r_y2": 219.56500000000005, "r_x3": 369.237, "r_y3": 219.56500000000005, "coord_origin": "TOPLEFT"}, "text": "and Roberto Vezzani, editors,", "orig": "and Roberto Vezzani, editors,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 188, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 483.119, "r_y0": 227.13300000000004, "r_x1": 545.113, "r_y1": 227.13300000000004, "r_x2": 545.113, "r_y2": 219.40300000000002, "r_x3": 483.119, "r_y3": 219.40300000000002, "coord_origin": "TOPLEFT"}, "text": "Pattern Recogni-", "orig": "Pattern Recogni-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 189, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 238.091, "r_x1": 519.398, "r_y1": 238.091, "r_x2": 519.398, "r_y2": 230.361, "r_x3": 328.781, "r_y3": 230.361, "coord_origin": "TOPLEFT"}, "text": "tion. ICPR International Workshops and Challenges", "orig": "tion. ICPR International Workshops and Challenges", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 190, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 519.401, "r_y0": 238.22000000000003, "r_x1": 521.643, "r_y1": 238.22000000000003, "r_x2": 521.643, "r_y2": 230.52300000000002, "r_x3": 519.401, "r_y3": 230.52300000000002, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 191, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 524.691, "r_y0": 238.22000000000003, "r_x1": 545.108, "r_y1": 238.22000000000003, "r_x2": 545.108, "r_y2": 230.52300000000002, "r_x3": 524.691, "r_y3": 230.52300000000002, "coord_origin": "TOPLEFT"}, "text": "pages", "orig": "pages", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 192, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 249.17899999999997, "r_x1": 545.113, "r_y1": 249.17899999999997, "r_x2": 545.113, "r_y2": 241.48199999999997, "r_x3": 328.781, "r_y3": 241.48199999999997, "coord_origin": "TOPLEFT"}, "text": "644-658, Cham, 2021. Springer International Publishing. 2,", "orig": "644-658, Cham, 2021. Springer International Publishing. 2,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 193, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 260.13800000000003, "r_x1": 333.264, "r_y1": 260.13800000000003, "r_x2": 333.264, "r_y2": 252.44100000000003, "r_x3": 328.781, "r_y3": 252.44100000000003, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 8, "label": "list_item", "bbox": {"l": 308.862, "t": 263.88699999999994, "r": 545.114, "b": 326.378, "coord_origin": "TOPLEFT"}, "confidence": 0.937321662902832, "cells": [{"index": 194, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 271.58399999999995, "r_x1": 323.8, "r_y1": 271.58399999999995, "r_x2": 323.8, "r_y2": 263.88699999999994, "r_x3": 308.862, "r_y3": 263.88699999999994, "coord_origin": "TOPLEFT"}, "text": "[19]", "orig": "[19]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 195, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.785, "r_y0": 271.58399999999995, "r_x1": 545.109, "r_y1": 271.58399999999995, "r_x2": 545.109, "r_y2": 263.88699999999994, "r_x3": 328.785, "r_y3": 263.88699999999994, "coord_origin": "TOPLEFT"}, "text": "Nikolaos Livathinos, Cesar Berrospi, Maksym Lysak, Vik-", "orig": "Nikolaos Livathinos, Cesar Berrospi, Maksym Lysak, Vik-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 196, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 282.543, "r_x1": 545.113, "r_y1": 282.543, "r_x2": 545.113, "r_y2": 274.846, "r_x3": 328.781, "r_y3": 274.846, "coord_origin": "TOPLEFT"}, "text": "tor Kuropiatnyk, Ahmed Nassar, Andre Carvalho, Michele", "orig": "tor Kuropiatnyk, Ahmed Nassar, Andre Carvalho, Michele", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 197, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 293.502, "r_x1": 527.118, "r_y1": 293.502, "r_x2": 527.118, "r_y2": 285.805, "r_x3": 328.781, "r_y3": 285.805, "coord_origin": "TOPLEFT"}, "text": "Dolfi, Christoph Auer, Kasper Dinkla, and Peter Staar.", "orig": "Dolfi, Christoph Auer, Kasper Dinkla, and Peter Staar.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 198, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 531.664, "r_y0": 293.502, "r_x1": 545.113, "r_y1": 293.502, "r_x2": 545.113, "r_y2": 285.805, "r_x3": 531.664, "r_y3": 285.805, "coord_origin": "TOPLEFT"}, "text": "Ro-", "orig": "Ro-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 199, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 304.461, "r_x1": 343.549, "r_y1": 304.461, "r_x2": 343.549, "r_y2": 296.764, "r_x3": 328.781, "r_y3": 296.764, "coord_origin": "TOPLEFT"}, "text": "bust", "orig": "bust", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 200, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 347.44, "r_y0": 304.461, "r_x1": 545.113, "r_y1": 304.461, "r_x2": 545.113, "r_y2": 296.764, "r_x3": 347.44, "r_y3": 296.764, "coord_origin": "TOPLEFT"}, "text": "pdf document conversion using recurrent neural net-", "orig": "pdf document conversion using recurrent neural net-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 201, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 315.419, "r_x1": 352.847, "r_y1": 315.419, "r_x2": 352.847, "r_y2": 307.722, "r_x3": 328.781, "r_y3": 307.722, "coord_origin": "TOPLEFT"}, "text": "works.", "orig": "works.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 202, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 360.236, "r_y0": 315.29, "r_x1": 545.114, "r_y1": 315.29, "r_x2": 545.114, "r_y2": 307.56, "r_x3": 360.236, "r_y3": 307.56, "coord_origin": "TOPLEFT"}, "text": "Proceedings of the AAAI Conference on Artificial", "orig": "Proceedings of the AAAI Conference on Artificial", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 203, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 326.249, "r_x1": 371.022, "r_y1": 326.249, "r_x2": 371.022, "r_y2": 318.519, "r_x3": 328.781, "r_y3": 318.519, "coord_origin": "TOPLEFT"}, "text": "Intelligence", "orig": "Intelligence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 204, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 371.021, "r_y0": 326.378, "r_x1": 502.262, "r_y1": 326.378, "r_x2": 502.262, "r_y2": 318.681, "r_x3": 371.021, "r_y3": 318.681, "coord_origin": "TOPLEFT"}, "text": ", 35(17):15137-15145, May 2021. 1", "orig": ", 35(17):15137-15145, May 2021. 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 18, "label": "list_item", "bbox": {"l": 308.862, "t": 330.127, "r": 545.116, "b": 370.701, "coord_origin": "TOPLEFT"}, "confidence": 0.9027292728424072, "cells": [{"index": 205, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 337.824, "r_x1": 323.8, "r_y1": 337.824, "r_x2": 323.8, "r_y2": 330.127, "r_x3": 308.862, "r_y3": 330.127, "coord_origin": "TOPLEFT"}, "text": "[20]", "orig": "[20]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 206, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.785, "r_y0": 337.824, "r_x1": 545.109, "r_y1": 337.824, "r_x2": 545.109, "r_y2": 330.127, "r_x3": 328.785, "r_y3": 330.127, "coord_origin": "TOPLEFT"}, "text": "Rujiao Long, Wen Wang, Nan Xue, Feiyu Gao, Zhibo Yang,", "orig": "Rujiao Long, Wen Wang, Nan Xue, Feiyu Gao, Zhibo Yang,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 207, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 348.783, "r_x1": 456.821, "r_y1": 348.783, "r_x2": 456.821, "r_y2": 341.086, "r_x3": 328.781, "r_y3": 341.086, "coord_origin": "TOPLEFT"}, "text": "Yongpan Wang, and Gui-Song Xia.", "orig": "Yongpan Wang, and Gui-Song Xia.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 208, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 460.991, "r_y0": 348.783, "r_x1": 545.113, "r_y1": 348.783, "r_x2": 545.113, "r_y2": 341.086, "r_x3": 460.991, "r_y3": 341.086, "coord_origin": "TOPLEFT"}, "text": "Parsing table structures", "orig": "Parsing table structures", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 209, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 359.742, "r_x1": 370.421, "r_y1": 359.742, "r_x2": 370.421, "r_y2": 352.045, "r_x3": 328.781, "r_y3": 352.045, "coord_origin": "TOPLEFT"}, "text": "in the wild.", "orig": "in the wild.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 210, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 375.308, "r_y0": 359.742, "r_x1": 382.777, "r_y1": 359.742, "r_x2": 382.777, "r_y2": 352.045, "r_x3": 375.308, "r_y3": 352.045, "coord_origin": "TOPLEFT"}, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 211, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 385.541, "r_y0": 359.613, "r_x1": 545.116, "r_y1": 359.613, "r_x2": 545.116, "r_y2": 351.883, "r_x3": 385.541, "r_y3": 351.883, "coord_origin": "TOPLEFT"}, "text": "Proceedings of the IEEE/CVF International", "orig": "Proceedings of the IEEE/CVF International", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 212, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 370.572, "r_x1": 443.596, "r_y1": 370.572, "r_x2": 443.596, "r_y2": 362.842, "r_x3": 328.781, "r_y3": 362.842, "coord_origin": "TOPLEFT"}, "text": "Conference on Computer Vision", "orig": "Conference on Computer Vision", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 213, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 443.594, "r_y0": 370.701, "r_x1": 534.486, "r_y1": 370.701, "r_x2": 534.486, "r_y2": 363.004, "r_x3": 443.594, "r_y3": 363.004, "coord_origin": "TOPLEFT"}, "text": ", pages 944-952, 2021. 2", "orig": ", pages 944-952, 2021. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 21, "label": "list_item", "bbox": {"l": 308.862, "t": 374.449, "r": 545.113, "b": 436.941, "coord_origin": "TOPLEFT"}, "confidence": 0.882714569568634, "cells": [{"index": 214, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 382.146, "r_x1": 323.8, "r_y1": 382.146, "r_x2": 323.8, "r_y2": 374.449, "r_x3": 308.862, "r_y3": 374.449, "coord_origin": "TOPLEFT"}, "text": "[21]", "orig": "[21]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 215, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.785, "r_y0": 382.146, "r_x1": 362.66, "r_y1": 382.146, "r_x2": 362.66, "r_y2": 374.449, "r_x3": 328.785, "r_y3": 374.449, "coord_origin": "TOPLEFT"}, "text": "Shubham", "orig": "Shubham", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 216, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 368.695, "r_y0": 382.146, "r_x1": 389.613, "r_y1": 382.146, "r_x2": 389.613, "r_y2": 374.449, "r_x3": 368.695, "r_y3": 374.449, "coord_origin": "TOPLEFT"}, "text": "Singh", "orig": "Singh", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 217, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 395.648, "r_y0": 382.146, "r_x1": 424.564, "r_y1": 382.146, "r_x2": 424.564, "r_y2": 374.449, "r_x3": 395.648, "r_y3": 374.449, "coord_origin": "TOPLEFT"}, "text": "Paliwal,", "orig": "Paliwal,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 218, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 431.549, "r_y0": 382.146, "r_x1": 488.504, "r_y1": 382.146, "r_x2": 488.504, "r_y2": 374.449, "r_x3": 431.549, "r_y3": 374.449, "coord_origin": "TOPLEFT"}, "text": "D Vishwanath,", "orig": "D Vishwanath,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 219, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 495.48, "r_y0": 382.146, "r_x1": 515.412, "r_y1": 382.146, "r_x2": 515.412, "r_y2": 374.449, "r_x3": 495.48, "r_y3": 374.449, "coord_origin": "TOPLEFT"}, "text": "Rohit", "orig": "Rohit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 220, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 521.446, "r_y0": 382.146, "r_x1": 545.109, "r_y1": 382.146, "r_x2": 545.109, "r_y2": 374.449, "r_x3": 521.446, "r_y3": 374.449, "coord_origin": "TOPLEFT"}, "text": "Rahul,", "orig": "Rahul,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 221, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 393.105, "r_x1": 460.318, "r_y1": 393.105, "r_x2": 460.318, "r_y2": 385.408, "r_x3": 328.781, "r_y3": 385.408, "coord_origin": "TOPLEFT"}, "text": "Monika Sharma, and Lovekesh Vig.", "orig": "Monika Sharma, and Lovekesh Vig.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 222, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 465.393, "r_y0": 393.105, "r_x1": 498.542, "r_y1": 393.105, "r_x2": 498.542, "r_y2": 385.408, "r_x3": 465.393, "r_y3": 385.408, "coord_origin": "TOPLEFT"}, "text": "Tablenet:", "orig": "Tablenet:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 223, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 502.469, "r_y0": 393.105, "r_x1": 545.113, "r_y1": 393.105, "r_x2": 545.113, "r_y2": 385.408, "r_x3": 502.469, "r_y3": 385.408, "coord_origin": "TOPLEFT"}, "text": "Deep learn-", "orig": "Deep learn-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 224, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 404.064, "r_x1": 545.113, "r_y1": 404.064, "r_x2": 545.113, "r_y2": 396.367, "r_x3": 328.781, "r_y3": 396.367, "coord_origin": "TOPLEFT"}, "text": "ing model for end-to-end table detection and tabular data ex-", "orig": "ing model for end-to-end table detection and tabular data ex-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 225, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 415.023, "r_x1": 478.009, "r_y1": 415.023, "r_x2": 478.009, "r_y2": 407.326, "r_x3": 328.781, "r_y3": 407.326, "coord_origin": "TOPLEFT"}, "text": "traction from scanned document images.", "orig": "traction from scanned document images.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 226, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 484.07, "r_y0": 415.023, "r_x1": 491.539, "r_y1": 415.023, "r_x2": 491.539, "r_y2": 407.326, "r_x3": 484.07, "r_y3": 407.326, "coord_origin": "TOPLEFT"}, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 227, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 494.668, "r_y0": 414.894, "r_x1": 545.113, "r_y1": 414.894, "r_x2": 545.113, "r_y2": 407.164, "r_x3": 494.668, "r_y3": 407.164, "coord_origin": "TOPLEFT"}, "text": "2019 Interna-", "orig": "2019 Interna-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 228, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 425.853, "r_x1": 349.709, "r_y1": 425.853, "r_x2": 349.709, "r_y2": 418.123, "r_x3": 328.781, "r_y3": 418.123, "coord_origin": "TOPLEFT"}, "text": "tional", "orig": "tional", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 229, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 353.295, "r_y0": 425.853, "r_x1": 545.113, "r_y1": 425.853, "r_x2": 545.113, "r_y2": 418.123, "r_x3": 353.295, "r_y3": 418.123, "coord_origin": "TOPLEFT"}, "text": "Conference on Document Analysis and Recognition", "orig": "Conference on Document Analysis and Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 230, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 436.812, "r_x1": 360.836, "r_y1": 436.812, "r_x2": 360.836, "r_y2": 429.082, "r_x3": 328.781, "r_y3": 429.082, "coord_origin": "TOPLEFT"}, "text": "(ICDAR)", "orig": "(ICDAR)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 231, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 360.836, "r_y0": 436.941, "r_x1": 475.633, "r_y1": 436.941, "r_x2": 475.633, "r_y2": 429.244, "r_x3": 360.836, "r_y3": 429.244, "coord_origin": "TOPLEFT"}, "text": ", pages 128-133. IEEE, 2019. 1", "orig": ", pages 128-133. IEEE, 2019. 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 20, "label": "list_item", "bbox": {"l": 308.862, "t": 440.689, "r": 545.115, "b": 557.975, "coord_origin": "TOPLEFT"}, "confidence": 0.8896440863609314, "cells": [{"index": 232, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 448.386, "r_x1": 323.8, "r_y1": 448.386, "r_x2": 323.8, "r_y2": 440.689, "r_x3": 308.862, "r_y3": 440.689, "coord_origin": "TOPLEFT"}, "text": "[22]", "orig": "[22]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 233, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.785, "r_y0": 448.386, "r_x1": 545.109, "r_y1": 448.386, "r_x2": 545.109, "r_y2": 440.689, "r_x3": 328.785, "r_y3": 440.689, "coord_origin": "TOPLEFT"}, "text": "Adam Paszke, Sam Gross, Francisco Massa, Adam Lerer,", "orig": "Adam Paszke, Sam Gross, Francisco Massa, Adam Lerer,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 234, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 459.345, "r_x1": 545.113, "r_y1": 459.345, "r_x2": 545.113, "r_y2": 451.648, "r_x3": 328.781, "r_y3": 451.648, "coord_origin": "TOPLEFT"}, "text": "James Bradbury, Gregory Chanan, Trevor Killeen, Zeming", "orig": "James Bradbury, Gregory Chanan, Trevor Killeen, Zeming", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 235, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 470.304, "r_x1": 343.477, "r_y1": 470.304, "r_x2": 343.477, "r_y2": 462.607, "r_x3": 328.781, "r_y3": 462.607, "coord_origin": "TOPLEFT"}, "text": "Lin,", "orig": "Lin,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 236, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 347.601, "r_y0": 470.304, "r_x1": 373.496, "r_y1": 470.304, "r_x2": 373.496, "r_y2": 462.607, "r_x3": 347.601, "r_y3": 462.607, "coord_origin": "TOPLEFT"}, "text": "Natalia", "orig": "Natalia", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 237, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 377.244, "r_y0": 470.304, "r_x1": 420.83, "r_y1": 470.304, "r_x2": 420.83, "r_y2": 462.607, "r_x3": 377.244, "r_y3": 462.607, "coord_origin": "TOPLEFT"}, "text": "Gimelshein,", "orig": "Gimelshein,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 238, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 424.955, "r_y0": 470.304, "r_x1": 473.239, "r_y1": 470.304, "r_x2": 473.239, "r_y2": 462.607, "r_x3": 424.955, "r_y3": 462.607, "coord_origin": "TOPLEFT"}, "text": "Luca Antiga,", "orig": "Luca Antiga,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 239, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 477.363, "r_y0": 470.304, "r_x1": 545.113, "r_y1": 470.304, "r_x2": 545.113, "r_y2": 462.607, "r_x3": 477.363, "r_y3": 462.607, "coord_origin": "TOPLEFT"}, "text": "Alban Desmaison,", "orig": "Alban Desmaison,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 240, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 481.263, "r_x1": 545.113, "r_y1": 481.263, "r_x2": 545.113, "r_y2": 473.566, "r_x3": 328.781, "r_y3": 473.566, "coord_origin": "TOPLEFT"}, "text": "Andreas Kopf, Edward Yang, Zachary DeVito, Martin Rai-", "orig": "Andreas Kopf, Edward Yang, Zachary DeVito, Martin Rai-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 241, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 492.222, "r_x1": 545.113, "r_y1": 492.222, "r_x2": 545.113, "r_y2": 484.525, "r_x3": 328.781, "r_y3": 484.525, "coord_origin": "TOPLEFT"}, "text": "son, Alykhan Tejani, Sasank Chilamkurthy, Benoit Steiner,", "orig": "son, Alykhan Tejani, Sasank Chilamkurthy, Benoit Steiner,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 242, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 503.181, "r_x1": 545.113, "r_y1": 503.181, "r_x2": 545.113, "r_y2": 495.484, "r_x3": 328.781, "r_y3": 495.484, "coord_origin": "TOPLEFT"}, "text": "Lu Fang, Junjie Bai, and Soumith Chintala. Pytorch: An im-", "orig": "Lu Fang, Junjie Bai, and Soumith Chintala. Pytorch: An im-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 243, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 514.14, "r_x1": 545.113, "r_y1": 514.14, "r_x2": 545.113, "r_y2": 506.443, "r_x3": 328.781, "r_y3": 506.443, "coord_origin": "TOPLEFT"}, "text": "perative style, high-performance deep learning library. In H.", "orig": "perative style, high-performance deep learning library. In H.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 244, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 525.0989999999999, "r_x1": 545.11, "r_y1": 525.0989999999999, "r_x2": 545.11, "r_y2": 517.402, "r_x3": 328.781, "r_y3": 517.402, "coord_origin": "TOPLEFT"}, "text": "Wallach, H. Larochelle, A. Beygelzimer, F. d'Alch\u00b4-Buc, E.", "orig": "Wallach, H. Larochelle, A. Beygelzimer, F. d'Alch\u00b4-Buc, E.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 245, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 511.145, "r_y0": 525.0989999999999, "r_x1": 515.126, "r_y1": 525.0989999999999, "r_x2": 515.126, "r_y2": 517.402, "r_x3": 511.145, "r_y3": 517.402, "coord_origin": "TOPLEFT"}, "text": "e", "orig": "e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 246, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 536.057, "r_x1": 434.567, "r_y1": 536.057, "r_x2": 434.567, "r_y2": 528.36, "r_x3": 328.781, "r_y3": 528.36, "coord_origin": "TOPLEFT"}, "text": "Fox, and R. Garnett, editors,", "orig": "Fox, and R. Garnett, editors,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 247, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 437.864, "r_y0": 535.928, "r_x1": 545.111, "r_y1": 535.928, "r_x2": 545.111, "r_y2": 528.198, "r_x3": 437.864, "r_y3": 528.198, "coord_origin": "TOPLEFT"}, "text": "Advances in Neural Informa-", "orig": "Advances in Neural Informa-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 248, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 546.887, "r_x1": 425.735, "r_y1": 546.887, "r_x2": 425.735, "r_y2": 539.157, "r_x3": 328.781, "r_y3": 539.157, "coord_origin": "TOPLEFT"}, "text": "tion Processing Systems 32", "orig": "tion Processing Systems 32", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 249, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 425.736, "r_y0": 547.016, "r_x1": 545.115, "r_y1": 547.016, "r_x2": 545.115, "r_y2": 539.319, "r_x3": 425.736, "r_y3": 539.319, "coord_origin": "TOPLEFT"}, "text": ", pages 8024-8035. Curran Asso-", "orig": ", pages 8024-8035. Curran Asso-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 250, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 557.975, "r_x1": 399.741, "r_y1": 557.975, "r_x2": 399.741, "r_y2": 550.278, "r_x3": 328.781, "r_y3": 550.278, "coord_origin": "TOPLEFT"}, "text": "ciates, Inc., 2019. 6", "orig": "ciates, Inc., 2019. 6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 19, "label": "list_item", "bbox": {"l": 308.862, "t": 561.7239999999999, "r": 545.113, "b": 624.215, "coord_origin": "TOPLEFT"}, "confidence": 0.9025435447692871, "cells": [{"index": 251, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 569.421, "r_x1": 323.8, "r_y1": 569.421, "r_x2": 323.8, "r_y2": 561.7239999999999, "r_x3": 308.862, "r_y3": 561.7239999999999, "coord_origin": "TOPLEFT"}, "text": "[23]", "orig": "[23]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 252, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.785, "r_y0": 569.421, "r_x1": 395.433, "r_y1": 569.421, "r_x2": 395.433, "r_y2": 561.7239999999999, "r_x3": 328.785, "r_y3": 561.7239999999999, "coord_origin": "TOPLEFT"}, "text": "Devashish Prasad,", "orig": "Devashish Prasad,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 253, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 399.369, "r_y0": 569.421, "r_x1": 545.109, "r_y1": 569.421, "r_x2": 545.109, "r_y2": 561.7239999999999, "r_x3": 399.369, "r_y3": 561.7239999999999, "coord_origin": "TOPLEFT"}, "text": "Ayan Gadpal, Kshitij Kapadni, Manish", "orig": "Ayan Gadpal, Kshitij Kapadni, Manish", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 254, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 580.38, "r_x1": 545.113, "r_y1": 580.38, "r_x2": 545.113, "r_y2": 572.683, "r_x3": 328.781, "r_y3": 572.683, "coord_origin": "TOPLEFT"}, "text": "Visave, and Kavita Sultanpure. Cascadetabnet: An approach", "orig": "Visave, and Kavita Sultanpure. Cascadetabnet: An approach", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 255, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 591.3389999999999, "r_x1": 545.113, "r_y1": 591.3389999999999, "r_x2": 545.113, "r_y2": 583.642, "r_x3": 328.781, "r_y3": 583.642, "coord_origin": "TOPLEFT"}, "text": "for end to end table detection and structure recognition from", "orig": "for end to end table detection and structure recognition from", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 256, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 602.298, "r_x1": 418.266, "r_y1": 602.298, "r_x2": 418.266, "r_y2": 594.601, "r_x3": 328.781, "r_y3": 594.601, "coord_origin": "TOPLEFT"}, "text": "image-based documents.", "orig": "image-based documents.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 257, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 424.148, "r_y0": 602.298, "r_x1": 431.617, "r_y1": 602.298, "r_x2": 431.617, "r_y2": 594.601, "r_x3": 424.148, "r_y3": 594.601, "coord_origin": "TOPLEFT"}, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 258, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 434.691, "r_y0": 602.169, "r_x1": 545.112, "r_y1": 602.169, "r_x2": 545.112, "r_y2": 594.439, "r_x3": 434.691, "r_y3": 594.439, "coord_origin": "TOPLEFT"}, "text": "Proceedings of the IEEE/CVF", "orig": "Proceedings of the IEEE/CVF", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 259, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 613.127, "r_x1": 369.784, "r_y1": 613.127, "r_x2": 369.784, "r_y2": 605.3969999999999, "r_x3": 328.781, "r_y3": 605.3969999999999, "coord_origin": "TOPLEFT"}, "text": "Conference", "orig": "Conference", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 260, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 374.008, "r_y0": 613.127, "r_x1": 449.549, "r_y1": 613.127, "r_x2": 449.549, "r_y2": 605.3969999999999, "r_x3": 374.008, "r_y3": 605.3969999999999, "coord_origin": "TOPLEFT"}, "text": "on Computer Vision", "orig": "on Computer Vision", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 261, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 453.782, "r_y0": 613.127, "r_x1": 497.636, "r_y1": 613.127, "r_x2": 497.636, "r_y2": 605.3969999999999, "r_x3": 453.782, "r_y3": 605.3969999999999, "coord_origin": "TOPLEFT"}, "text": "and Pattern", "orig": "and Pattern", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 262, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 501.868, "r_y0": 613.127, "r_x1": 545.113, "r_y1": 613.127, "r_x2": 545.113, "r_y2": 605.3969999999999, "r_x3": 501.868, "r_y3": 605.3969999999999, "coord_origin": "TOPLEFT"}, "text": "Recognition", "orig": "Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 263, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 624.086, "r_x1": 367.803, "r_y1": 624.086, "r_x2": 367.803, "r_y2": 616.356, "r_x3": 328.781, "r_y3": 616.356, "coord_origin": "TOPLEFT"}, "text": "Workshops", "orig": "Workshops", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 264, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 367.802, "r_y0": 624.215, "r_x1": 458.694, "r_y1": 624.215, "r_x2": 458.694, "r_y2": 616.518, "r_x3": 367.802, "r_y3": 616.518, "coord_origin": "TOPLEFT"}, "text": ", pages 572-573, 2020. 1", "orig": ", pages 572-573, 2020. 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 23, "label": "list_item", "bbox": {"l": 308.862, "t": 627.9639999999999, "r": 545.116, "b": 668.538, "coord_origin": "TOPLEFT"}, "confidence": 0.8777532577514648, "cells": [{"index": 265, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 635.6610000000001, "r_x1": 323.8, "r_y1": 635.6610000000001, "r_x2": 323.8, "r_y2": 627.9639999999999, "r_x3": 308.862, "r_y3": 627.9639999999999, "coord_origin": "TOPLEFT"}, "text": "[24]", "orig": "[24]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 266, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.785, "r_y0": 635.6610000000001, "r_x1": 545.109, "r_y1": 635.6610000000001, "r_x2": 545.109, "r_y2": 627.9639999999999, "r_x3": 328.785, "r_y3": 627.9639999999999, "coord_origin": "TOPLEFT"}, "text": "Shah Rukh Qasim, Hassan Mahmood, and Faisal Shafait.", "orig": "Shah Rukh Qasim, Hassan Mahmood, and Faisal Shafait.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 267, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 646.62, "r_x1": 545.113, "r_y1": 646.62, "r_x2": 545.113, "r_y2": 638.923, "r_x3": 328.781, "r_y3": 638.923, "coord_origin": "TOPLEFT"}, "text": "Rethinking table recognition using graph neural networks.", "orig": "Rethinking table recognition using graph neural networks.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 268, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 657.579, "r_x1": 336.25, "r_y1": 657.579, "r_x2": 336.25, "r_y2": 649.8820000000001, "r_x3": 328.781, "r_y3": 649.8820000000001, "coord_origin": "TOPLEFT"}, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 269, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 338.1, "r_y0": 657.45, "r_x1": 545.116, "r_y1": 657.45, "r_x2": 545.116, "r_y2": 649.72, "r_x3": 338.1, "r_y3": 649.72, "coord_origin": "TOPLEFT"}, "text": "2019 International Conference on Document Analysis and", "orig": "2019 International Conference on Document Analysis and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 270, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 668.409, "r_x1": 406.322, "r_y1": 668.409, "r_x2": 406.322, "r_y2": 660.679, "r_x3": 328.781, "r_y3": 660.679, "coord_origin": "TOPLEFT"}, "text": "Recognition (ICDAR)", "orig": "Recognition (ICDAR)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 271, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 406.322, "r_y0": 668.538, "r_x1": 521.119, "r_y1": 668.538, "r_x2": 521.119, "r_y2": 660.841, "r_x3": 406.322, "r_y3": 660.841, "coord_origin": "TOPLEFT"}, "text": ", pages 142-147. IEEE, 2019. 3", "orig": ", pages 142-147. IEEE, 2019. 3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 24, "label": "list_item", "bbox": {"l": 308.862, "t": 672.2860000000001, "r": 545.113, "b": 712.86, "coord_origin": "TOPLEFT"}, "confidence": 0.8654531240463257, "cells": [{"index": 272, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 679.983, "r_x1": 323.8, "r_y1": 679.983, "r_x2": 323.8, "r_y2": 672.2860000000001, "r_x3": 308.862, "r_y3": 672.2860000000001, "coord_origin": "TOPLEFT"}, "text": "[25]", "orig": "[25]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 273, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.785, "r_y0": 679.983, "r_x1": 400.857, "r_y1": 679.983, "r_x2": 400.857, "r_y2": 672.2860000000001, "r_x3": 328.785, "r_y3": 672.2860000000001, "coord_origin": "TOPLEFT"}, "text": "Hamid Rezatofighi,", "orig": "Hamid Rezatofighi,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 274, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 405.403, "r_y0": 679.983, "r_x1": 453.571, "r_y1": 679.983, "r_x2": 453.571, "r_y2": 672.2860000000001, "r_x3": 405.403, "r_y3": 672.2860000000001, "coord_origin": "TOPLEFT"}, "text": "Nathan Tsoi,", "orig": "Nathan Tsoi,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 275, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 458.117, "r_y0": 679.983, "r_x1": 521.635, "r_y1": 679.983, "r_x2": 521.635, "r_y2": 672.2860000000001, "r_x3": 458.117, "r_y3": 672.2860000000001, "coord_origin": "TOPLEFT"}, "text": "JunYoung Gwak,", "orig": "JunYoung Gwak,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 276, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 526.181, "r_y0": 679.983, "r_x1": 545.109, "r_y1": 679.983, "r_x2": 545.109, "r_y2": 672.2860000000001, "r_x3": 526.181, "r_y3": 672.2860000000001, "coord_origin": "TOPLEFT"}, "text": "Amir", "orig": "Amir", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 277, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 690.942, "r_x1": 482.815, "r_y1": 690.942, "r_x2": 482.815, "r_y2": 683.245, "r_x3": 328.781, "r_y3": 683.245, "coord_origin": "TOPLEFT"}, "text": "Sadeghian, Ian Reid, and Silvio Savarese.", "orig": "Sadeghian, Ian Reid, and Silvio Savarese.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 278, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 488.751, "r_y0": 690.942, "r_x1": 545.113, "r_y1": 690.942, "r_x2": 545.113, "r_y2": 683.245, "r_x3": 488.751, "r_y3": 683.245, "coord_origin": "TOPLEFT"}, "text": "Generalized in-", "orig": "Generalized in-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 279, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 701.901, "r_x1": 545.113, "r_y1": 701.901, "r_x2": 545.113, "r_y2": 694.204, "r_x3": 328.781, "r_y3": 694.204, "coord_origin": "TOPLEFT"}, "text": "tersection over union: A metric and a loss for bounding box", "orig": "tersection over union: A metric and a loss for bounding box", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 280, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 712.86, "r_x1": 367.74, "r_y1": 712.86, "r_x2": 367.74, "r_y2": 705.163, "r_x3": 328.781, "r_y3": 705.163, "coord_origin": "TOPLEFT"}, "text": "regression.", "orig": "regression.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 281, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 371.685, "r_y0": 712.86, "r_x1": 379.154, "r_y1": 712.86, "r_x2": 379.154, "r_y2": 705.163, "r_x3": 371.685, "r_y3": 705.163, "coord_origin": "TOPLEFT"}, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 282, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 381.616, "r_y0": 712.731, "r_x1": 545.109, "r_y1": 712.731, "r_x2": 545.109, "r_y2": 705.001, "r_x3": 381.616, "r_y3": 705.001, "coord_origin": "TOPLEFT"}, "text": "Proceedings of the IEEE/CVF Conference on", "orig": "Proceedings of the IEEE/CVF Conference on", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 22, "label": "page_footer", "bbox": {"l": 295.121, "t": 734.402, "r": 300.102, "b": 742.954, "coord_origin": "TOPLEFT"}, "confidence": 0.8797808885574341, "cells": [{"index": 283, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 295.121, "r_y0": 742.954, "r_x1": 300.102, "r_y1": 742.954, "r_x2": 300.102, "r_y2": 734.402, "r_x3": 295.121, "r_y3": 734.402, "coord_origin": "TOPLEFT"}, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}]}, "tablestructure": {"table_map": {}}, "figures_classification": null, "equations_prediction": null, "vlm_response": null}, "assembled": {"elements": [{"label": "list_item", "id": 25, "page_no": 8, "cluster": {"id": 25, "label": "list_item", "bbox": {"l": 70.031, "t": 76.12599999999998, "r": 286.363, "b": 116.69899999999996, "coord_origin": "TOPLEFT"}, "confidence": 0.7310384511947632, "cells": [{"index": 0, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 83.82299999999998, "r_x1": 212.373, "r_y1": 83.82299999999998, "r_x2": 212.373, "r_y2": 76.12599999999998, "r_x3": 70.031, "r_y3": 76.12599999999998, "coord_origin": "TOPLEFT"}, "text": "end object detection with transformers.", "orig": "end object detection with transformers.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 217.313, "r_y0": 83.82299999999998, "r_x1": 286.363, "r_y1": 83.82299999999998, "r_x2": 286.363, "r_y2": 76.12599999999998, "r_x3": 217.313, "r_y3": 76.12599999999998, "coord_origin": "TOPLEFT"}, "text": "In Andrea Vedaldi,", "orig": "In Andrea Vedaldi,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 94.78200000000004, "r_x1": 286.363, "r_y1": 94.78200000000004, "r_x2": 286.363, "r_y2": 87.08500000000004, "r_x3": 70.031, "r_y3": 87.08500000000004, "coord_origin": "TOPLEFT"}, "text": "Horst Bischof, Thomas Brox, and Jan-Michael Frahm, edi-", "orig": "Horst Bischof, Thomas Brox, and Jan-Michael Frahm, edi-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 105.74000000000001, "r_x1": 85.722, "r_y1": 105.74000000000001, "r_x2": 85.722, "r_y2": 98.043, "r_x3": 70.031, "r_y3": 98.043, "coord_origin": "TOPLEFT"}, "text": "tors,", "orig": "tors,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 87.889, "r_y0": 105.61099999999999, "r_x1": 199.933, "r_y1": 105.61099999999999, "r_x2": 199.933, "r_y2": 97.88099999999997, "r_x3": 87.889, "r_y3": 97.88099999999997, "coord_origin": "TOPLEFT"}, "text": "Computer Vision - ECCV 2020", "orig": "Computer Vision - ECCV 2020", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 199.936, "r_y0": 105.74000000000001, "r_x1": 286.363, "r_y1": 105.74000000000001, "r_x2": 286.363, "r_y2": 98.043, "r_x3": 199.936, "r_y3": 98.043, "coord_origin": "TOPLEFT"}, "text": ", pages 213-229, Cham,", "orig": ", pages 213-229, Cham,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 116.69899999999996, "r_x1": 221.949, "r_y1": 116.69899999999996, "r_x2": 221.949, "r_y2": 109.00199999999995, "r_x3": 70.031, "r_y3": 109.00199999999995, "coord_origin": "TOPLEFT"}, "text": "2020. Springer International Publishing. 5", "orig": "2020. Springer International Publishing. 5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "end object detection with transformers. In Andrea Vedaldi, Horst Bischof, Thomas Brox, and Jan-Michael Frahm, editors, Computer Vision - ECCV 2020 , pages 213-229, Cham, 2020. Springer International Publishing. 5"}, {"label": "list_item", "id": 9, "page_no": 8, "cluster": {"id": 9, "label": "list_item", "bbox": {"l": 54.595, "t": 120.274, "r": 286.363, "b": 149.889, "coord_origin": "TOPLEFT"}, "confidence": 0.9372755885124207, "cells": [{"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 54.595, "r_y0": 127.971, "r_x1": 65.05, "r_y1": 127.971, "r_x2": 65.05, "r_y2": 120.274, "r_x3": 54.595, "r_y3": 120.274, "coord_origin": "TOPLEFT"}, "text": "[2]", "orig": "[2]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 127.971, "r_x1": 286.359, "r_y1": 127.971, "r_x2": 286.359, "r_y2": 120.274, "r_x3": 70.035, "r_y3": 120.274, "coord_origin": "TOPLEFT"}, "text": "Zewen Chi, Heyan Huang, Heng-Da Xu, Houjin Yu, Wanx-", "orig": "Zewen Chi, Heyan Huang, Heng-Da Xu, Houjin Yu, Wanx-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 138.92999999999995, "r_x1": 179.672, "r_y1": 138.92999999999995, "r_x2": 179.672, "r_y2": 131.23299999999995, "r_x3": 70.031, "r_y3": 131.23299999999995, "coord_origin": "TOPLEFT"}, "text": "uan Yin, and Xian-Ling Mao.", "orig": "uan Yin, and Xian-Ling Mao.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 185.581, "r_y0": 138.92999999999995, "r_x1": 286.363, "r_y1": 138.92999999999995, "r_x2": 286.363, "r_y2": 131.23299999999995, "r_x3": 185.581, "r_y3": 131.23299999999995, "coord_origin": "TOPLEFT"}, "text": "Complicated table structure", "orig": "Complicated table structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 149.889, "r_x1": 113.115, "r_y1": 149.889, "r_x2": 113.115, "r_y2": 142.192, "r_x3": 70.031, "r_y3": 142.192, "coord_origin": "TOPLEFT"}, "text": "recognition.", "orig": "recognition.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 116.342, "r_y0": 149.76, "r_x1": 235.308, "r_y1": 149.76, "r_x2": 235.308, "r_y2": 142.02999999999997, "r_x3": 116.342, "r_y3": 142.02999999999997, "coord_origin": "TOPLEFT"}, "text": "arXiv preprint arXiv:1908.04729", "orig": "arXiv preprint arXiv:1908.04729", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 235.307, "r_y0": 149.889, "r_x1": 267.676, "r_y1": 149.889, "r_x2": 267.676, "r_y2": 142.192, "r_x3": 235.307, "r_y3": 142.192, "coord_origin": "TOPLEFT"}, "text": ", 2019. 3", "orig": ", 2019. 3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[2] Zewen Chi, Heyan Huang, Heng-Da Xu, Houjin Yu, Wanxuan Yin, and Xian-Ling Mao. Complicated table structure recognition. arXiv preprint arXiv:1908.04729 , 2019. 3"}, {"label": "list_item", "id": 7, "page_no": 8, "cluster": {"id": 7, "label": "list_item", "bbox": {"l": 54.595, "t": 153.30200000000002, "r": 286.363, "b": 183.07799999999997, "coord_origin": "TOPLEFT"}, "confidence": 0.9378374218940735, "cells": [{"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 54.595, "r_y0": 161.16099999999994, "r_x1": 65.05, "r_y1": 161.16099999999994, "r_x2": 65.05, "r_y2": 153.46400000000006, "r_x3": 54.595, "r_y3": 153.46400000000006, "coord_origin": "TOPLEFT"}, "text": "[3]", "orig": "[3]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 161.16099999999994, "r_x1": 218.779, "r_y1": 161.16099999999994, "r_x2": 218.779, "r_y2": 153.46400000000006, "r_x3": 70.035, "r_y3": 153.46400000000006, "coord_origin": "TOPLEFT"}, "text": "Bertrand Couasnon and Aurelie Lemaitre.", "orig": "Bertrand Couasnon and Aurelie Lemaitre.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 220.98, "r_y0": 161.03200000000004, "r_x1": 286.363, "r_y1": 161.03200000000004, "r_x2": 286.363, "r_y2": 153.30200000000002, "r_x3": 220.98, "r_y3": 153.30200000000002, "coord_origin": "TOPLEFT"}, "text": "Recognition of Ta-", "orig": "Recognition of Ta-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 171.99099999999999, "r_x1": 125.264, "r_y1": 171.99099999999999, "r_x2": 125.264, "r_y2": 164.26099999999997, "r_x3": 70.031, "r_y3": 164.26099999999997, "coord_origin": "TOPLEFT"}, "text": "bles and Forms", "orig": "bles and Forms", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 125.261, "r_y0": 172.12, "r_x1": 127.503, "r_y1": 172.12, "r_x2": 127.503, "r_y2": 164.423, "r_x3": 125.261, "r_y3": 164.423, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 19, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 129.986, "r_y0": 172.12, "r_x1": 286.36, "r_y1": 172.12, "r_x2": 286.36, "r_y2": 164.423, "r_x3": 129.986, "r_y3": 164.423, "coord_origin": "TOPLEFT"}, "text": "pages 647-677. Springer London, London,", "orig": "pages 647-677. Springer London, London,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 20, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 183.07799999999997, "r_x1": 97.917, "r_y1": 183.07799999999997, "r_x2": 97.917, "r_y2": 175.38099999999997, "r_x3": 70.031, "r_y3": 175.38099999999997, "coord_origin": "TOPLEFT"}, "text": "2014. 2", "orig": "2014. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[3] Bertrand Couasnon and Aurelie Lemaitre. Recognition of Tables and Forms , pages 647-677. Springer London, London, 2014. 2"}, {"label": "list_item", "id": 0, "page_no": 8, "cluster": {"id": 0, "label": "list_item", "bbox": {"l": 54.595, "t": 186.65300000000002, "r": 286.364, "b": 227.22699999999998, "coord_origin": "TOPLEFT"}, "confidence": 0.9648825526237488, "cells": [{"index": 21, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 54.595, "r_y0": 194.35000000000002, "r_x1": 65.05, "r_y1": 194.35000000000002, "r_x2": 65.05, "r_y2": 186.65300000000002, "r_x3": 54.595, "r_y3": 186.65300000000002, "coord_origin": "TOPLEFT"}, "text": "[4]", "orig": "[4]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 22, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 194.35000000000002, "r_x1": 91.936, "r_y1": 194.35000000000002, "r_x2": 91.936, "r_y2": 186.65300000000002, "r_x3": 70.035, "r_y3": 186.65300000000002, "coord_origin": "TOPLEFT"}, "text": "Herv\u00b4 e", "orig": "Herv\u00b4 e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 23, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 97.101, "r_y0": 194.35000000000002, "r_x1": 124.736, "r_y1": 194.35000000000002, "r_x2": 124.736, "r_y2": 186.65300000000002, "r_x3": 97.101, "r_y3": 186.65300000000002, "coord_origin": "TOPLEFT"}, "text": "D\u00b4jean,", "orig": "D\u00b4jean,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 24, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 103.575, "r_y0": 194.35000000000002, "r_x1": 107.556, "r_y1": 194.35000000000002, "r_x2": 107.556, "r_y2": 186.65300000000002, "r_x3": 103.575, "r_y3": 186.65300000000002, "coord_origin": "TOPLEFT"}, "text": "e", "orig": "e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 25, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 130.636, "r_y0": 194.35000000000002, "r_x1": 163.497, "r_y1": 194.35000000000002, "r_x2": 163.497, "r_y2": 186.65300000000002, "r_x3": 130.636, "r_y3": 186.65300000000002, "coord_origin": "TOPLEFT"}, "text": "Jean-Luc", "orig": "Jean-Luc", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 26, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 168.662, "r_y0": 194.35000000000002, "r_x1": 200.923, "r_y1": 194.35000000000002, "r_x2": 200.923, "r_y2": 186.65300000000002, "r_x3": 168.662, "r_y3": 186.65300000000002, "coord_origin": "TOPLEFT"}, "text": "Meunier,", "orig": "Meunier,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 27, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 206.814, "r_y0": 194.35000000000002, "r_x1": 238.188, "r_y1": 194.35000000000002, "r_x2": 238.188, "r_y2": 186.65300000000002, "r_x3": 206.814, "r_y3": 186.65300000000002, "coord_origin": "TOPLEFT"}, "text": "Liangcai", "orig": "Liangcai", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 28, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 243.352, "r_y0": 194.35000000000002, "r_x1": 260.532, "r_y1": 194.35000000000002, "r_x2": 260.532, "r_y2": 186.65300000000002, "r_x3": 243.352, "r_y3": 186.65300000000002, "coord_origin": "TOPLEFT"}, "text": "Gao,", "orig": "Gao,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 29, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 266.432, "r_y0": 194.35000000000002, "r_x1": 286.364, "r_y1": 194.35000000000002, "r_x2": 286.364, "r_y2": 186.65300000000002, "r_x3": 266.432, "r_y3": 186.65300000000002, "coord_origin": "TOPLEFT"}, "text": "Yilun", "orig": "Yilun", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 30, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 205.30899999999997, "r_x1": 269.605, "r_y1": 205.30899999999997, "r_x2": 269.605, "r_y2": 197.61199999999997, "r_x3": 70.031, "r_y3": 197.61199999999997, "coord_origin": "TOPLEFT"}, "text": "Huang, Yu Fang, Florian Kleber, and Eva-Maria Lang.", "orig": "Huang, Yu Fang, Florian Kleber, and Eva-Maria Lang.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 274.411, "r_y0": 205.30899999999997, "r_x1": 286.363, "r_y1": 205.30899999999997, "r_x2": 286.363, "r_y2": 197.61199999999997, "r_x3": 274.411, "r_y3": 197.61199999999997, "coord_origin": "TOPLEFT"}, "text": "IC-", "orig": "IC-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 216.26800000000003, "r_x1": 286.363, "r_y1": 216.26800000000003, "r_x2": 286.363, "r_y2": 208.57100000000003, "r_x3": 70.031, "r_y3": 208.57100000000003, "coord_origin": "TOPLEFT"}, "text": "DAR 2019 Competition on Table Detection and Recognition", "orig": "DAR 2019 Competition on Table Detection and Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 227.22699999999998, "r_x1": 245.835, "r_y1": 227.22699999999998, "r_x2": 245.835, "r_y2": 219.52999999999997, "r_x3": 70.031, "r_y3": 219.52999999999997, "coord_origin": "TOPLEFT"}, "text": "(cTDaR), Apr. 2019. http://sac.founderit.com/. 2", "orig": "(cTDaR), Apr. 2019. http://sac.founderit.com/. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[4] Herv\u00b4 e D\u00b4jean, e Jean-Luc Meunier, Liangcai Gao, Yilun Huang, Yu Fang, Florian Kleber, and Eva-Maria Lang. ICDAR 2019 Competition on Table Detection and Recognition (cTDaR), Apr. 2019. http://sac.founderit.com/. 2"}, {"label": "list_item", "id": 1, "page_no": 8, "cluster": {"id": 1, "label": "list_item", "bbox": {"l": 54.595, "t": 230.80200000000002, "r": 286.363, "b": 271.375, "coord_origin": "TOPLEFT"}, "confidence": 0.9620943069458008, "cells": [{"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 54.595, "r_y0": 238.49900000000002, "r_x1": 65.05, "r_y1": 238.49900000000002, "r_x2": 65.05, "r_y2": 230.80200000000002, "r_x3": 54.595, "r_y3": 230.80200000000002, "coord_origin": "TOPLEFT"}, "text": "[5]", "orig": "[5]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 238.49900000000002, "r_x1": 286.359, "r_y1": 238.49900000000002, "r_x2": 286.359, "r_y2": 230.80200000000002, "r_x3": 70.035, "r_y3": 230.80200000000002, "coord_origin": "TOPLEFT"}, "text": "Basilios Gatos, Dimitrios Danatsas, Ioannis Pratikakis, and", "orig": "Basilios Gatos, Dimitrios Danatsas, Ioannis Pratikakis, and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 249.45799999999997, "r_x1": 286.363, "r_y1": 249.45799999999997, "r_x2": 286.363, "r_y2": 241.76099999999997, "r_x3": 70.031, "r_y3": 241.76099999999997, "coord_origin": "TOPLEFT"}, "text": "Stavros J Perantonis. Automatic table detection in document", "orig": "Stavros J Perantonis. Automatic table detection in document", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 260.41600000000005, "r_x1": 108.398, "r_y1": 260.41600000000005, "r_x2": 108.398, "r_y2": 252.71900000000005, "r_x3": 70.031, "r_y3": 252.71900000000005, "coord_origin": "TOPLEFT"}, "text": "images. In", "orig": "images. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 110.645, "r_y0": 260.28700000000003, "r_x1": 286.36, "r_y1": 260.28700000000003, "r_x2": 286.36, "r_y2": 252.55700000000002, "r_x3": 110.645, "r_y3": 252.55700000000002, "coord_origin": "TOPLEFT"}, "text": "International Conference on Pattern Recognition", "orig": "International Conference on Pattern Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 271.246, "r_x1": 140.579, "r_y1": 271.246, "r_x2": 140.579, "r_y2": 263.51599999999996, "r_x3": 70.031, "r_y3": 263.51599999999996, "coord_origin": "TOPLEFT"}, "text": "and Image Analysis", "orig": "and Image Analysis", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 140.578, "r_y0": 271.375, "r_x1": 266.475, "r_y1": 271.375, "r_x2": 266.475, "r_y2": 263.678, "r_x3": 140.578, "r_y3": 263.678, "coord_origin": "TOPLEFT"}, "text": ", pages 609-618. Springer, 2005. 2", "orig": ", pages 609-618. Springer, 2005. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[5] Basilios Gatos, Dimitrios Danatsas, Ioannis Pratikakis, and Stavros J Perantonis. Automatic table detection in document images. In International Conference on Pattern Recognition and Image Analysis , pages 609-618. Springer, 2005. 2"}, {"label": "list_item", "id": 2, "page_no": 8, "cluster": {"id": 2, "label": "list_item", "bbox": {"l": 54.595, "t": 274.95000000000005, "r": 286.367, "b": 315.524, "coord_origin": "TOPLEFT"}, "confidence": 0.9555517435073853, "cells": [{"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 54.595, "r_y0": 282.647, "r_x1": 65.05, "r_y1": 282.647, "r_x2": 65.05, "r_y2": 274.95000000000005, "r_x3": 54.595, "r_y3": 274.95000000000005, "coord_origin": "TOPLEFT"}, "text": "[6]", "orig": "[6]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 282.647, "r_x1": 286.367, "r_y1": 282.647, "r_x2": 286.367, "r_y2": 274.95000000000005, "r_x3": 70.035, "r_y3": 274.95000000000005, "coord_origin": "TOPLEFT"}, "text": "MaxG\u00a8bel, Tamir Hassan, Ermelinda Oro, and Giorgio Orsi.", "orig": "MaxG\u00a8bel, Tamir Hassan, Ermelinda Oro, and Giorgio Orsi.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 94.719, "r_y0": 282.647, "r_x1": 99.202, "r_y1": 282.647, "r_x2": 99.202, "r_y2": 274.95000000000005, "r_x3": 94.719, "r_y3": 274.95000000000005, "coord_origin": "TOPLEFT"}, "text": "o", "orig": "o", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 293.606, "r_x1": 179.574, "r_y1": 293.606, "r_x2": 179.574, "r_y2": 285.909, "r_x3": 70.031, "r_y3": 285.909, "coord_origin": "TOPLEFT"}, "text": "Icdar 2013 table competition.", "orig": "Icdar 2013 table competition.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 187.016, "r_y0": 293.606, "r_x1": 194.485, "r_y1": 293.606, "r_x2": 194.485, "r_y2": 285.909, "r_x3": 187.016, "r_y3": 285.909, "coord_origin": "TOPLEFT"}, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 198.044, "r_y0": 293.477, "r_x1": 286.363, "r_y1": 293.477, "r_x2": 286.363, "r_y2": 285.747, "r_x3": 198.044, "r_y3": 285.747, "coord_origin": "TOPLEFT"}, "text": "2013 12th International", "orig": "2013 12th International", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 304.436, "r_x1": 260.199, "r_y1": 304.436, "r_x2": 260.199, "r_y2": 296.706, "r_x3": 70.031, "r_y3": 296.706, "coord_origin": "TOPLEFT"}, "text": "Conference on Document Analysis and Recognition", "orig": "Conference on Document Analysis and Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 48, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 260.198, "r_y0": 304.565, "r_x1": 262.44, "r_y1": 304.565, "r_x2": 262.44, "r_y2": 296.868, "r_x3": 260.198, "r_y3": 296.868, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 49, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 265.945, "r_y0": 304.565, "r_x1": 286.362, "r_y1": 304.565, "r_x2": 286.362, "r_y2": 296.868, "r_x3": 265.945, "r_y3": 296.868, "coord_origin": "TOPLEFT"}, "text": "pages", "orig": "pages", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 50, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 315.524, "r_x1": 142.749, "r_y1": 315.524, "r_x2": 142.749, "r_y2": 307.827, "r_x3": 70.031, "r_y3": 307.827, "coord_origin": "TOPLEFT"}, "text": "1449-1453, 2013. 2", "orig": "1449-1453, 2013. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[6] MaxG\u00a8bel, Tamir Hassan, Ermelinda Oro, and Giorgio Orsi. o Icdar 2013 table competition. In 2013 12th International Conference on Document Analysis and Recognition , pages 1449-1453, 2013. 2"}, {"label": "list_item", "id": 4, "page_no": 8, "cluster": {"id": 4, "label": "list_item", "bbox": {"l": 54.595, "t": 319.099, "r": 286.363, "b": 348.713, "coord_origin": "TOPLEFT"}, "confidence": 0.9479843378067017, "cells": [{"index": 51, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 54.595, "r_y0": 326.796, "r_x1": 65.05, "r_y1": 326.796, "r_x2": 65.05, "r_y2": 319.099, "r_x3": 54.595, "r_y3": 319.099, "coord_origin": "TOPLEFT"}, "text": "[7]", "orig": "[7]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 52, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 326.796, "r_x1": 199.492, "r_y1": 326.796, "r_x2": 199.492, "r_y2": 319.099, "r_x3": 70.035, "r_y3": 319.099, "coord_origin": "TOPLEFT"}, "text": "EA Green and M Krishnamoorthy.", "orig": "EA Green and M Krishnamoorthy.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 53, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 206.988, "r_y0": 326.796, "r_x1": 286.359, "r_y1": 326.796, "r_x2": 286.359, "r_y2": 319.099, "r_x3": 206.988, "r_y3": 319.099, "coord_origin": "TOPLEFT"}, "text": "Recognition of tables", "orig": "Recognition of tables", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 54, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 337.754, "r_x1": 176.283, "r_y1": 337.754, "r_x2": 176.283, "r_y2": 330.057, "r_x3": 70.031, "r_y3": 330.057, "coord_origin": "TOPLEFT"}, "text": "using table grammars. procs.", "orig": "using table grammars. procs.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 55, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 182.604, "r_y0": 337.754, "r_x1": 190.073, "r_y1": 337.754, "r_x2": 190.073, "r_y2": 330.057, "r_x3": 182.604, "r_y3": 330.057, "coord_origin": "TOPLEFT"}, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 56, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 193.283, "r_y0": 337.625, "r_x1": 286.363, "r_y1": 337.625, "r_x2": 286.363, "r_y2": 329.895, "r_x3": 193.283, "r_y3": 329.895, "coord_origin": "TOPLEFT"}, "text": "Symposium on Document", "orig": "Symposium on Document", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 57, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 348.584, "r_x1": 206.347, "r_y1": 348.584, "r_x2": 206.347, "r_y2": 340.854, "r_x3": 70.031, "r_y3": 340.854, "coord_origin": "TOPLEFT"}, "text": "Analysis and Recognition (SDAIR'95)", "orig": "Analysis and Recognition (SDAIR'95)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 58, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 206.346, "r_y0": 348.713, "r_x1": 274.822, "r_y1": 348.713, "r_x2": 274.822, "r_y2": 341.016, "r_x3": 206.346, "r_y3": 341.016, "coord_origin": "TOPLEFT"}, "text": ", pages 261-277. 2", "orig": ", pages 261-277. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[7] EA Green and M Krishnamoorthy. Recognition of tables using table grammars. procs. In Symposium on Document Analysis and Recognition (SDAIR'95) , pages 261-277. 2"}, {"label": "list_item", "id": 3, "page_no": 8, "cluster": {"id": 3, "label": "list_item", "bbox": {"l": 54.595, "t": 352.288, "r": 286.363, "b": 403.821, "coord_origin": "TOPLEFT"}, "confidence": 0.9484425187110901, "cells": [{"index": 59, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 54.595, "r_y0": 359.985, "r_x1": 65.05, "r_y1": 359.985, "r_x2": 65.05, "r_y2": 352.288, "r_x3": 54.595, "r_y3": 352.288, "coord_origin": "TOPLEFT"}, "text": "[8]", "orig": "[8]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 60, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 359.985, "r_x1": 286.359, "r_y1": 359.985, "r_x2": 286.359, "r_y2": 352.288, "r_x3": 70.035, "r_y3": 352.288, "coord_origin": "TOPLEFT"}, "text": "Khurram Azeem Hashmi, Alain Pagani, Marcus Liwicki, Di-", "orig": "Khurram Azeem Hashmi, Alain Pagani, Marcus Liwicki, Di-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 61, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 370.944, "r_x1": 234.125, "r_y1": 370.944, "r_x2": 234.125, "r_y2": 363.247, "r_x3": 70.031, "r_y3": 363.247, "coord_origin": "TOPLEFT"}, "text": "dier Stricker, and Muhammad Zeshan Afzal.", "orig": "dier Stricker, and Muhammad Zeshan Afzal.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 62, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 240.052, "r_y0": 370.944, "r_x1": 286.363, "r_y1": 370.944, "r_x2": 286.363, "r_y2": 363.247, "r_x3": 240.052, "r_y3": 363.247, "coord_origin": "TOPLEFT"}, "text": "Castabdetec-", "orig": "Castabdetec-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 63, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 381.903, "r_x1": 85.973, "r_y1": 381.903, "r_x2": 85.973, "r_y2": 374.206, "r_x3": 70.031, "r_y3": 374.206, "coord_origin": "TOPLEFT"}, "text": "tors:", "orig": "tors:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 64, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 90.349, "r_y0": 381.903, "r_x1": 286.363, "r_y1": 381.903, "r_x2": 286.363, "r_y2": 374.206, "r_x3": 90.349, "r_y3": 374.206, "coord_origin": "TOPLEFT"}, "text": "Cascade network for table detection in document im-", "orig": "Cascade network for table detection in document im-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 65, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 392.862, "r_x1": 286.363, "r_y1": 392.862, "r_x2": 286.363, "r_y2": 385.165, "r_x3": 70.031, "r_y3": 385.165, "coord_origin": "TOPLEFT"}, "text": "ages with recursive feature pyramid and switchable atrous", "orig": "ages with recursive feature pyramid and switchable atrous", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 66, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 403.821, "r_x1": 114.576, "r_y1": 403.821, "r_x2": 114.576, "r_y2": 396.124, "r_x3": 70.031, "r_y3": 396.124, "coord_origin": "TOPLEFT"}, "text": "convolution.", "orig": "convolution.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 67, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 117.804, "r_y0": 403.692, "r_x1": 186.729, "r_y1": 403.692, "r_x2": 186.729, "r_y2": 395.962, "r_x3": 117.804, "r_y3": 395.962, "coord_origin": "TOPLEFT"}, "text": "Journal of Imaging", "orig": "Journal of Imaging", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 68, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 186.728, "r_y0": 403.821, "r_x1": 243.001, "r_y1": 403.821, "r_x2": 243.001, "r_y2": 396.124, "r_x3": 186.728, "r_y3": 396.124, "coord_origin": "TOPLEFT"}, "text": ", 7(10), 2021. 1", "orig": ", 7(10), 2021. 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[8] Khurram Azeem Hashmi, Alain Pagani, Marcus Liwicki, Didier Stricker, and Muhammad Zeshan Afzal. Castabdetectors: Cascade network for table detection in document images with recursive feature pyramid and switchable atrous convolution. Journal of Imaging , 7(10), 2021. 1"}, {"label": "list_item", "id": 10, "page_no": 8, "cluster": {"id": 10, "label": "list_item", "bbox": {"l": 54.595, "t": 407.395, "r": 286.36, "b": 437.01, "coord_origin": "TOPLEFT"}, "confidence": 0.9330756664276123, "cells": [{"index": 69, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 54.595, "r_y0": 415.092, "r_x1": 65.05, "r_y1": 415.092, "r_x2": 65.05, "r_y2": 407.395, "r_x3": 54.595, "r_y3": 407.395, "coord_origin": "TOPLEFT"}, "text": "[9]", "orig": "[9]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 70, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 415.092, "r_x1": 286.359, "r_y1": 415.092, "r_x2": 286.359, "r_y2": 407.395, "r_x3": 70.035, "r_y3": 407.395, "coord_origin": "TOPLEFT"}, "text": "Kaiming He, Georgia Gkioxari, Piotr Dollar, and Ross Gir-", "orig": "Kaiming He, Georgia Gkioxari, Piotr Dollar, and Ross Gir-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 71, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 426.051, "r_x1": 147.133, "r_y1": 426.051, "r_x2": 147.133, "r_y2": 418.354, "r_x3": 70.031, "r_y3": 418.354, "coord_origin": "TOPLEFT"}, "text": "shick. Mask r-cnn. In", "orig": "shick. Mask r-cnn. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 72, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 149.156, "r_y0": 425.922, "r_x1": 286.36, "r_y1": 425.922, "r_x2": 286.36, "r_y2": 418.192, "r_x3": 149.156, "r_y3": 418.192, "coord_origin": "TOPLEFT"}, "text": "Proceedings of the IEEE International", "orig": "Proceedings of the IEEE International", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 73, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 436.881, "r_x1": 213.484, "r_y1": 436.881, "r_x2": 213.484, "r_y2": 429.151, "r_x3": 70.031, "r_y3": 429.151, "coord_origin": "TOPLEFT"}, "text": "Conference on Computer Vision (ICCV)", "orig": "Conference on Computer Vision (ICCV)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 74, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 213.483, "r_y0": 437.01, "r_x1": 261.041, "r_y1": 437.01, "r_x2": 261.041, "r_y2": 429.313, "r_x3": 213.483, "r_y3": 429.313, "coord_origin": "TOPLEFT"}, "text": ", Oct 2017. 1", "orig": ", Oct 2017. 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[9] Kaiming He, Georgia Gkioxari, Piotr Dollar, and Ross Girshick. Mask r-cnn. In Proceedings of the IEEE International Conference on Computer Vision (ICCV) , Oct 2017. 1"}, {"label": "list_item", "id": 14, "page_no": 8, "cluster": {"id": 14, "label": "list_item", "bbox": {"l": 50.112, "t": 440.585, "r": 286.363, "b": 481.159, "coord_origin": "TOPLEFT"}, "confidence": 0.9274735450744629, "cells": [{"index": 75, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 448.282, "r_x1": 65.05, "r_y1": 448.282, "r_x2": 65.05, "r_y2": 440.585, "r_x3": 50.112, "r_y3": 440.585, "coord_origin": "TOPLEFT"}, "text": "[10]", "orig": "[10]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 76, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 448.282, "r_x1": 286.359, "r_y1": 448.282, "r_x2": 286.359, "r_y2": 440.585, "r_x3": 70.035, "r_y3": 440.585, "coord_origin": "TOPLEFT"}, "text": "Yelin He, X. Qi, Jiaquan Ye, Peng Gao, Yihao Chen, Bing-", "orig": "Yelin He, X. Qi, Jiaquan Ye, Peng Gao, Yihao Chen, Bing-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 77, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 459.241, "r_x1": 202.743, "r_y1": 459.241, "r_x2": 202.743, "r_y2": 451.544, "r_x3": 70.031, "r_y3": 451.544, "coord_origin": "TOPLEFT"}, "text": "cong Li, Xin Tang, and Rong Xiao.", "orig": "cong Li, Xin Tang, and Rong Xiao.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 78, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 209.001, "r_y0": 459.241, "r_x1": 286.363, "r_y1": 459.241, "r_x2": 286.363, "r_y2": 451.544, "r_x3": 209.001, "r_y3": 451.544, "coord_origin": "TOPLEFT"}, "text": "Pingan-vcgroup's so-", "orig": "Pingan-vcgroup's so-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 79, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 470.2, "r_x1": 286.363, "r_y1": 470.2, "r_x2": 286.363, "r_y2": 462.503, "r_x3": 70.031, "r_y3": 462.503, "coord_origin": "TOPLEFT"}, "text": "lution for icdar 2021 competition on scientific table image", "orig": "lution for icdar 2021 competition on scientific table image", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 80, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 481.159, "r_x1": 141.87, "r_y1": 481.159, "r_x2": 141.87, "r_y2": 473.462, "r_x3": 70.031, "r_y3": 473.462, "coord_origin": "TOPLEFT"}, "text": "recognition to latex.", "orig": "recognition to latex.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 81, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 145.097, "r_y0": 481.03, "r_x1": 166.016, "r_y1": 481.03, "r_x2": 166.016, "r_y2": 473.3, "r_x3": 145.097, "r_y3": 473.3, "coord_origin": "TOPLEFT"}, "text": "ArXiv", "orig": "ArXiv", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 82, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 166.015, "r_y0": 481.159, "r_x1": 259.902, "r_y1": 481.159, "r_x2": 259.902, "r_y2": 473.462, "r_x3": 166.015, "r_y3": 473.462, "coord_origin": "TOPLEFT"}, "text": ", abs/2105.01846, 2021. 2", "orig": ", abs/2105.01846, 2021. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[10] Yelin He, X. Qi, Jiaquan Ye, Peng Gao, Yihao Chen, Bingcong Li, Xin Tang, and Rong Xiao. Pingan-vcgroup's solution for icdar 2021 competition on scientific table image recognition to latex. ArXiv , abs/2105.01846, 2021. 2"}, {"label": "list_item", "id": 11, "page_no": 8, "cluster": {"id": 11, "label": "list_item", "bbox": {"l": 50.112, "t": 484.733, "r": 286.363, "b": 536.266, "coord_origin": "TOPLEFT"}, "confidence": 0.9299950003623962, "cells": [{"index": 83, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 492.43, "r_x1": 65.05, "r_y1": 492.43, "r_x2": 65.05, "r_y2": 484.733, "r_x3": 50.112, "r_y3": 484.733, "coord_origin": "TOPLEFT"}, "text": "[11]", "orig": "[11]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 84, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 492.43, "r_x1": 117.091, "r_y1": 492.43, "r_x2": 117.091, "r_y2": 484.733, "r_x3": 70.035, "r_y3": 484.733, "coord_origin": "TOPLEFT"}, "text": "Jianying Hu,", "orig": "Jianying Hu,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 85, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 121.054, "r_y0": 492.43, "r_x1": 286.359, "r_y1": 492.43, "r_x2": 286.359, "r_y2": 484.733, "r_x3": 121.054, "r_y3": 484.733, "coord_origin": "TOPLEFT"}, "text": "Ramanujan S Kashi, Daniel P Lopresti, and", "orig": "Ramanujan S Kashi, Daniel P Lopresti, and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 86, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 503.389, "r_x1": 132.15, "r_y1": 503.389, "r_x2": 132.15, "r_y2": 495.692, "r_x3": 70.031, "r_y3": 495.692, "coord_origin": "TOPLEFT"}, "text": "Gordon Wilfong.", "orig": "Gordon Wilfong.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 87, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 137.691, "r_y0": 503.389, "r_x1": 273.362, "r_y1": 503.389, "r_x2": 273.362, "r_y2": 495.692, "r_x3": 137.691, "r_y3": 495.692, "coord_origin": "TOPLEFT"}, "text": "Medium-independent table detection.", "orig": "Medium-independent table detection.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 88, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 278.894, "r_y0": 503.389, "r_x1": 286.363, "r_y1": 503.389, "r_x2": 286.363, "r_y2": 495.692, "r_x3": 278.894, "r_y3": 495.692, "coord_origin": "TOPLEFT"}, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 89, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 514.219, "r_x1": 106.883, "r_y1": 514.219, "r_x2": 106.883, "r_y2": 506.489, "r_x3": 70.031, "r_y3": 506.489, "coord_origin": "TOPLEFT"}, "text": "Document", "orig": "Document", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 90, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 111.796, "r_y0": 514.219, "r_x1": 155.041, "r_y1": 514.219, "r_x2": 155.041, "r_y2": 506.489, "r_x3": 111.796, "r_y3": 506.489, "coord_origin": "TOPLEFT"}, "text": "Recognition", "orig": "Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 91, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 159.946, "r_y0": 514.219, "r_x1": 173.396, "r_y1": 514.219, "r_x2": 173.396, "r_y2": 506.489, "r_x3": 159.946, "r_y3": 506.489, "coord_origin": "TOPLEFT"}, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 92, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 178.309, "r_y0": 514.219, "r_x1": 211.046, "r_y1": 514.219, "r_x2": 211.046, "r_y2": 506.489, "r_x3": 178.309, "r_y3": 506.489, "coord_origin": "TOPLEFT"}, "text": "Retrieval", "orig": "Retrieval", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 93, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 215.959, "r_y0": 514.219, "r_x1": 227.409, "r_y1": 514.219, "r_x2": 227.409, "r_y2": 506.489, "r_x3": 215.959, "r_y3": 506.489, "coord_origin": "TOPLEFT"}, "text": "VII", "orig": "VII", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 94, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 227.405, "r_y0": 514.348, "r_x1": 229.647, "r_y1": 514.348, "r_x2": 229.647, "r_y2": 506.651, "r_x3": 227.405, "r_y3": 506.651, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 95, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 234.56, "r_y0": 514.348, "r_x1": 261.28, "r_y1": 514.348, "r_x2": 261.28, "r_y2": 506.651, "r_x3": 234.56, "r_y3": 506.651, "coord_origin": "TOPLEFT"}, "text": "volume", "orig": "volume", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 96, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 266.185, "r_y0": 514.348, "r_x1": 286.359, "r_y1": 514.348, "r_x2": 286.359, "r_y2": 506.651, "r_x3": 266.185, "r_y3": 506.651, "coord_origin": "TOPLEFT"}, "text": "3967,", "orig": "3967,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 97, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 525.307, "r_x1": 286.363, "r_y1": 525.307, "r_x2": 286.363, "r_y2": 517.61, "r_x3": 70.031, "r_y3": 517.61, "coord_origin": "TOPLEFT"}, "text": "pages 291-302. International Society for Optics and Photon-", "orig": "pages 291-302. International Society for Optics and Photon-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 98, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 536.266, "r_x1": 112.361, "r_y1": 536.266, "r_x2": 112.361, "r_y2": 528.569, "r_x3": 70.031, "r_y3": 528.569, "coord_origin": "TOPLEFT"}, "text": "ics, 1999. 2", "orig": "ics, 1999. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[11] Jianying Hu, Ramanujan S Kashi, Daniel P Lopresti, and Gordon Wilfong. Medium-independent table detection. In Document Recognition and Retrieval VII , volume 3967, pages 291-302. International Society for Optics and Photonics, 1999. 2"}, {"label": "list_item", "id": 5, "page_no": 8, "cluster": {"id": 5, "label": "list_item", "bbox": {"l": 50.112, "t": 539.841, "r": 286.363, "b": 591.373, "coord_origin": "TOPLEFT"}, "confidence": 0.9394103288650513, "cells": [{"index": 99, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 547.538, "r_x1": 65.05, "r_y1": 547.538, "r_x2": 65.05, "r_y2": 539.841, "r_x3": 50.112, "r_y3": 539.841, "coord_origin": "TOPLEFT"}, "text": "[12]", "orig": "[12]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 100, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 547.538, "r_x1": 126.407, "r_y1": 547.538, "r_x2": 126.407, "r_y2": 539.841, "r_x3": 70.035, "r_y3": 539.841, "coord_origin": "TOPLEFT"}, "text": "Matthew Hurst.", "orig": "Matthew Hurst.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 101, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 130.648, "r_y0": 547.538, "r_x1": 286.359, "r_y1": 547.538, "r_x2": 286.359, "r_y2": 539.841, "r_x3": 130.648, "r_y3": 539.841, "coord_origin": "TOPLEFT"}, "text": "A constraint-based approach to table struc-", "orig": "A constraint-based approach to table struc-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 102, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 558.4970000000001, "r_x1": 124.654, "r_y1": 558.4970000000001, "r_x2": 124.654, "r_y2": 550.8, "r_x3": 70.031, "r_y3": 550.8, "coord_origin": "TOPLEFT"}, "text": "ture derivation.", "orig": "ture derivation.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 103, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 128.815, "r_y0": 558.4970000000001, "r_x1": 136.284, "r_y1": 558.4970000000001, "r_x2": 136.284, "r_y2": 550.8, "r_x3": 128.815, "r_y3": 550.8, "coord_origin": "TOPLEFT"}, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 104, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 138.811, "r_y0": 558.3679999999999, "r_x1": 286.362, "r_y1": 558.3679999999999, "r_x2": 286.362, "r_y2": 550.638, "r_x3": 138.811, "r_y3": 550.638, "coord_origin": "TOPLEFT"}, "text": "Proceedings of the Seventh International", "orig": "Proceedings of the Seventh International", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 105, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 569.327, "r_x1": 286.363, "r_y1": 569.327, "r_x2": 286.363, "r_y2": 561.597, "r_x3": 70.031, "r_y3": 561.597, "coord_origin": "TOPLEFT"}, "text": "Conference on Document Analysis and Recognition - Volume", "orig": "Conference on Document Analysis and Recognition - Volume", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 106, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 580.2860000000001, "r_x1": 74.514, "r_y1": 580.2860000000001, "r_x2": 74.514, "r_y2": 572.556, "r_x3": 70.031, "r_y3": 572.556, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 107, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 74.514, "r_y0": 580.415, "r_x1": 76.756, "r_y1": 580.415, "r_x2": 76.756, "r_y2": 572.718, "r_x3": 74.514, "r_y3": 572.718, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 108, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 79.06, "r_y0": 580.415, "r_x1": 286.363, "r_y1": 580.415, "r_x2": 286.363, "r_y2": 572.718, "r_x3": 79.06, "r_y3": 572.718, "coord_origin": "TOPLEFT"}, "text": "ICDAR '03, page 911, USA, 2003. IEEE Computer Soci-", "orig": "ICDAR '03, page 911, USA, 2003. IEEE Computer Soci-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 109, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 591.373, "r_x1": 82.647, "r_y1": 591.373, "r_x2": 82.647, "r_y2": 583.6759999999999, "r_x3": 70.031, "r_y3": 583.6759999999999, "coord_origin": "TOPLEFT"}, "text": "ety.", "orig": "ety.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 110, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 85.875, "r_y0": 591.373, "r_x1": 90.358, "r_y1": 591.373, "r_x2": 90.358, "r_y2": 583.6759999999999, "r_x3": 85.875, "r_y3": 583.6759999999999, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[12] Matthew Hurst. A constraint-based approach to table structure derivation. In Proceedings of the Seventh International Conference on Document Analysis and Recognition - Volume 2 , ICDAR '03, page 911, USA, 2003. IEEE Computer Society. 2"}, {"label": "list_item", "id": 13, "page_no": 8, "cluster": {"id": 13, "label": "list_item", "bbox": {"l": 50.112, "t": 594.948, "r": 286.363, "b": 646.481, "coord_origin": "TOPLEFT"}, "confidence": 0.9298838973045349, "cells": [{"index": 111, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 602.645, "r_x1": 65.05, "r_y1": 602.645, "r_x2": 65.05, "r_y2": 594.948, "r_x3": 50.112, "r_y3": 594.948, "coord_origin": "TOPLEFT"}, "text": "[13]", "orig": "[13]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 112, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 602.645, "r_x1": 116.302, "r_y1": 602.645, "r_x2": 116.302, "r_y2": 594.948, "r_x3": 70.035, "r_y3": 594.948, "coord_origin": "TOPLEFT"}, "text": "Thotreingam", "orig": "Thotreingam", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 113, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 121.368, "r_y0": 602.645, "r_x1": 144.161, "r_y1": 602.645, "r_x2": 144.161, "r_y2": 594.948, "r_x3": 121.368, "r_y3": 594.948, "coord_origin": "TOPLEFT"}, "text": "Kasar,", "orig": "Kasar,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 114, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 149.926, "r_y0": 602.645, "r_x1": 186.796, "r_y1": 602.645, "r_x2": 186.796, "r_y2": 594.948, "r_x3": 149.926, "r_y3": 594.948, "coord_origin": "TOPLEFT"}, "text": "Philippine", "orig": "Philippine", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 115, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 191.862, "r_y0": 602.645, "r_x1": 217.013, "r_y1": 602.645, "r_x2": 217.013, "r_y2": 594.948, "r_x3": 191.862, "r_y3": 594.948, "coord_origin": "TOPLEFT"}, "text": "Barlas,", "orig": "Barlas,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 116, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 222.778, "r_y0": 602.645, "r_x1": 257.146, "r_y1": 602.645, "r_x2": 257.146, "r_y2": 594.948, "r_x3": 222.778, "r_y3": 594.948, "coord_origin": "TOPLEFT"}, "text": "Sebastien", "orig": "Sebastien", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 117, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 262.203, "r_y0": 602.645, "r_x1": 286.359, "r_y1": 602.645, "r_x2": 286.359, "r_y2": 594.948, "r_x3": 262.203, "r_y3": 594.948, "coord_origin": "TOPLEFT"}, "text": "Adam,", "orig": "Adam,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 118, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 613.604, "r_x1": 214.838, "r_y1": 613.604, "r_x2": 214.838, "r_y2": 605.907, "r_x3": 70.031, "r_y3": 605.907, "coord_origin": "TOPLEFT"}, "text": "Cl\u00b4ment Chatelain, and Thierry Paquet.", "orig": "Cl\u00b4ment Chatelain, and Thierry Paquet.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 119, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 78.504, "r_y0": 613.604, "r_x1": 82.485, "r_y1": 613.604, "r_x2": 82.485, "r_y2": 605.907, "r_x3": 78.504, "r_y3": 605.907, "coord_origin": "TOPLEFT"}, "text": "e", "orig": "e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 120, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 219.949, "r_y0": 613.604, "r_x1": 286.363, "r_y1": 613.604, "r_x2": 286.363, "r_y2": 605.907, "r_x3": 219.949, "r_y3": 605.907, "coord_origin": "TOPLEFT"}, "text": "Learning to detect", "orig": "Learning to detect", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 121, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 624.563, "r_x1": 286.363, "r_y1": 624.563, "r_x2": 286.363, "r_y2": 616.866, "r_x3": 70.031, "r_y3": 616.866, "coord_origin": "TOPLEFT"}, "text": "tables in scanned document images using line information.", "orig": "tables in scanned document images using line information.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 122, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 635.5219999999999, "r_x1": 77.5, "r_y1": 635.5219999999999, "r_x2": 77.5, "r_y2": 627.825, "r_x3": 70.031, "r_y3": 627.825, "coord_origin": "TOPLEFT"}, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 123, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 79.92, "r_y0": 635.393, "r_x1": 286.362, "r_y1": 635.393, "r_x2": 286.362, "r_y2": 627.663, "r_x3": 79.92, "r_y3": 627.663, "coord_origin": "TOPLEFT"}, "text": "2013 12th International Conference on Document Analy-", "orig": "2013 12th International Conference on Document Analy-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 124, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 646.352, "r_x1": 140.677, "r_y1": 646.352, "r_x2": 140.677, "r_y2": 638.6220000000001, "r_x3": 70.031, "r_y3": 638.6220000000001, "coord_origin": "TOPLEFT"}, "text": "sis and Recognition", "orig": "sis and Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 125, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 140.676, "r_y0": 646.481, "r_x1": 264.439, "r_y1": 646.481, "r_x2": 264.439, "r_y2": 638.784, "r_x3": 140.676, "r_y3": 638.784, "coord_origin": "TOPLEFT"}, "text": ", pages 1185-1189. IEEE, 2013. 2", "orig": ", pages 1185-1189. IEEE, 2013. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[13] Thotreingam Kasar, Philippine Barlas, Sebastien Adam, Cl\u00b4ment Chatelain, and Thierry Paquet. e Learning to detect tables in scanned document images using line information. In 2013 12th International Conference on Document Analysis and Recognition , pages 1185-1189. IEEE, 2013. 2"}, {"label": "list_item", "id": 17, "page_no": 8, "cluster": {"id": 17, "label": "list_item", "bbox": {"l": 50.112, "t": 650.056, "r": 286.363, "b": 679.67, "coord_origin": "TOPLEFT"}, "confidence": 0.9115257263183594, "cells": [{"index": 126, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 657.7529999999999, "r_x1": 65.05, "r_y1": 657.7529999999999, "r_x2": 65.05, "r_y2": 650.056, "r_x3": 50.112, "r_y3": 650.056, "coord_origin": "TOPLEFT"}, "text": "[14]", "orig": "[14]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 127, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 657.7529999999999, "r_x1": 91.447, "r_y1": 657.7529999999999, "r_x2": 91.447, "r_y2": 650.056, "r_x3": 70.035, "r_y3": 650.056, "coord_origin": "TOPLEFT"}, "text": "Pratik", "orig": "Pratik", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 128, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 96.092, "r_y0": 657.7529999999999, "r_x1": 119.745, "r_y1": 657.7529999999999, "r_x2": 119.745, "r_y2": 650.056, "r_x3": 96.092, "r_y3": 650.056, "coord_origin": "TOPLEFT"}, "text": "Kayal,", "orig": "Kayal,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 129, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 124.99, "r_y0": 657.7529999999999, "r_x1": 149.397, "r_y1": 657.7529999999999, "r_x2": 149.397, "r_y2": 650.056, "r_x3": 124.99, "r_y3": 650.056, "coord_origin": "TOPLEFT"}, "text": "Mrinal", "orig": "Mrinal", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 130, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 154.042, "r_y0": 657.7529999999999, "r_x1": 180.188, "r_y1": 657.7529999999999, "r_x2": 180.188, "r_y2": 650.056, "r_x3": 154.042, "r_y3": 650.056, "coord_origin": "TOPLEFT"}, "text": "Anand,", "orig": "Anand,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 131, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 185.433, "r_y0": 657.7529999999999, "r_x1": 206.845, "r_y1": 657.7529999999999, "r_x2": 206.845, "r_y2": 650.056, "r_x3": 185.433, "r_y3": 650.056, "coord_origin": "TOPLEFT"}, "text": "Harsh", "orig": "Harsh", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 132, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 211.489, "r_y0": 657.7529999999999, "r_x1": 234.147, "r_y1": 657.7529999999999, "r_x2": 234.147, "r_y2": 650.056, "r_x3": 211.489, "r_y3": 650.056, "coord_origin": "TOPLEFT"}, "text": "Desai,", "orig": "Desai,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 133, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 239.393, "r_y0": 657.7529999999999, "r_x1": 252.34, "r_y1": 657.7529999999999, "r_x2": 252.34, "r_y2": 650.056, "r_x3": 239.393, "r_y3": 650.056, "coord_origin": "TOPLEFT"}, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 134, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 256.976, "r_y0": 657.7529999999999, "r_x1": 286.359, "r_y1": 657.7529999999999, "r_x2": 286.359, "r_y2": 650.056, "r_x3": 256.976, "r_y3": 650.056, "coord_origin": "TOPLEFT"}, "text": "Mayank", "orig": "Mayank", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 135, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 668.711, "r_x1": 93.2, "r_y1": 668.711, "r_x2": 93.2, "r_y2": 661.014, "r_x3": 70.031, "r_y3": 661.014, "coord_origin": "TOPLEFT"}, "text": "Singh.", "orig": "Singh.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 136, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 102.202, "r_y0": 668.711, "r_x1": 120.619, "r_y1": 668.711, "r_x2": 120.619, "r_y2": 661.014, "r_x3": 102.202, "r_y3": 661.014, "coord_origin": "TOPLEFT"}, "text": "Icdar", "orig": "Icdar", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 137, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 124.672, "r_y0": 668.711, "r_x1": 238.922, "r_y1": 668.711, "r_x2": 238.922, "r_y2": 661.014, "r_x3": 124.672, "r_y3": 661.014, "coord_origin": "TOPLEFT"}, "text": "2021 competition on scientific", "orig": "2021 competition on scientific", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 138, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 242.975, "r_y0": 668.711, "r_x1": 260.406, "r_y1": 668.711, "r_x2": 260.406, "r_y2": 661.014, "r_x3": 242.975, "r_y3": 661.014, "coord_origin": "TOPLEFT"}, "text": "table", "orig": "table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 139, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 264.449, "r_y0": 668.711, "r_x1": 286.363, "r_y1": 668.711, "r_x2": 286.363, "r_y2": 661.014, "r_x3": 264.449, "r_y3": 661.014, "coord_origin": "TOPLEFT"}, "text": "image", "orig": "image", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 140, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 679.67, "r_x1": 171.997, "r_y1": 679.67, "r_x2": 171.997, "r_y2": 671.973, "r_x3": 70.031, "r_y3": 671.973, "coord_origin": "TOPLEFT"}, "text": "recognition to latex, 2021. 2", "orig": "recognition to latex, 2021. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[14] Pratik Kayal, Mrinal Anand, Harsh Desai, and Mayank Singh. Icdar 2021 competition on scientific table image recognition to latex, 2021. 2"}, {"label": "list_item", "id": 16, "page_no": 8, "cluster": {"id": 16, "label": "list_item", "bbox": {"l": 50.112, "t": 683.245, "r": 286.359, "b": 712.86, "coord_origin": "TOPLEFT"}, "confidence": 0.912230372428894, "cells": [{"index": 141, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 690.942, "r_x1": 65.05, "r_y1": 690.942, "r_x2": 65.05, "r_y2": 683.245, "r_x3": 50.112, "r_y3": 683.245, "coord_origin": "TOPLEFT"}, "text": "[15]", "orig": "[15]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 142, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 690.942, "r_x1": 286.359, "r_y1": 690.942, "r_x2": 286.359, "r_y2": 683.245, "r_x3": 70.035, "r_y3": 683.245, "coord_origin": "TOPLEFT"}, "text": "Harold WKuhn. The hungarian method for the assignment", "orig": "Harold WKuhn. The hungarian method for the assignment", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 143, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 701.901, "r_x1": 102.158, "r_y1": 701.901, "r_x2": 102.158, "r_y2": 694.204, "r_x3": 70.031, "r_y3": 694.204, "coord_origin": "TOPLEFT"}, "text": "problem.", "orig": "problem.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 144, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 107.55, "r_y0": 701.772, "r_x1": 231.475, "r_y1": 701.772, "r_x2": 231.475, "r_y2": 694.042, "r_x3": 107.55, "r_y3": 694.042, "coord_origin": "TOPLEFT"}, "text": "Naval research logistics quarterly", "orig": "Naval research logistics quarterly", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 145, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 231.476, "r_y0": 701.901, "r_x1": 233.718, "r_y1": 701.901, "r_x2": 233.718, "r_y2": 694.204, "r_x3": 231.476, "r_y3": 694.204, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 146, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 236.802, "r_y0": 701.901, "r_x1": 286.359, "r_y1": 701.901, "r_x2": 286.359, "r_y2": 694.204, "r_x3": 236.802, "r_y3": 694.204, "coord_origin": "TOPLEFT"}, "text": "2(1-2):83-97,", "orig": "2(1-2):83-97,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 147, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 712.86, "r_x1": 97.917, "r_y1": 712.86, "r_x2": 97.917, "r_y2": 705.163, "r_x3": 70.031, "r_y3": 705.163, "coord_origin": "TOPLEFT"}, "text": "1955. 6", "orig": "1955. 6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[15] Harold WKuhn. The hungarian method for the assignment problem. Naval research logistics quarterly , 2(1-2):83-97, 1955. 6"}, {"label": "list_item", "id": 6, "page_no": 8, "cluster": {"id": 6, "label": "list_item", "bbox": {"l": 308.862, "t": 76.12599999999998, "r": 545.115, "b": 138.61699999999996, "coord_origin": "TOPLEFT"}, "confidence": 0.9389600157737732, "cells": [{"index": 148, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 83.82299999999998, "r_x1": 323.8, "r_y1": 83.82299999999998, "r_x2": 323.8, "r_y2": 76.12599999999998, "r_x3": 308.862, "r_y3": 76.12599999999998, "coord_origin": "TOPLEFT"}, "text": "[16]", "orig": "[16]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 149, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.785, "r_y0": 83.82299999999998, "r_x1": 351.192, "r_y1": 83.82299999999998, "r_x2": 351.192, "r_y2": 76.12599999999998, "r_x3": 328.785, "r_y3": 76.12599999999998, "coord_origin": "TOPLEFT"}, "text": "Girish", "orig": "Girish", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 150, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 355.308, "r_y0": 83.82299999999998, "r_x1": 389.291, "r_y1": 83.82299999999998, "r_x2": 389.291, "r_y2": 76.12599999999998, "r_x3": 355.308, "r_y3": 76.12599999999998, "coord_origin": "TOPLEFT"}, "text": "Kulkarni,", "orig": "Kulkarni,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 151, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 393.863, "r_y0": 83.82299999999998, "r_x1": 420.225, "r_y1": 83.82299999999998, "r_x2": 420.225, "r_y2": 76.12599999999998, "r_x3": 393.863, "r_y3": 76.12599999999998, "coord_origin": "TOPLEFT"}, "text": "Visruth", "orig": "Visruth", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 152, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 424.331, "r_y0": 83.82299999999998, "r_x1": 454.961, "r_y1": 83.82299999999998, "r_x2": 454.961, "r_y2": 76.12599999999998, "r_x3": 424.331, "r_y3": 76.12599999999998, "coord_origin": "TOPLEFT"}, "text": "Premraj,", "orig": "Premraj,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 153, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 459.533, "r_y0": 83.82299999999998, "r_x1": 486.881, "r_y1": 83.82299999999998, "r_x2": 486.881, "r_y2": 76.12599999999998, "r_x3": 459.533, "r_y3": 76.12599999999998, "coord_origin": "TOPLEFT"}, "text": "Vicente", "orig": "Vicente", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 154, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 490.988, "r_y0": 83.82299999999998, "r_x1": 524.1, "r_y1": 83.82299999999998, "r_x2": 524.1, "r_y2": 76.12599999999998, "r_x3": 490.988, "r_y3": 76.12599999999998, "coord_origin": "TOPLEFT"}, "text": "Ordonez,", "orig": "Ordonez,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 155, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 528.673, "r_y0": 83.82299999999998, "r_x1": 545.109, "r_y1": 83.82299999999998, "r_x2": 545.109, "r_y2": 76.12599999999998, "r_x3": 528.673, "r_y3": 76.12599999999998, "coord_origin": "TOPLEFT"}, "text": "Sag-", "orig": "Sag-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 156, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 94.78099999999995, "r_x1": 545.113, "r_y1": 94.78099999999995, "r_x2": 545.113, "r_y2": 87.08399999999995, "r_x3": 328.781, "r_y3": 87.08399999999995, "coord_origin": "TOPLEFT"}, "text": "nik Dhar, Siming Li, Yejin Choi, Alexander C. Berg, and", "orig": "nik Dhar, Siming Li, Yejin Choi, Alexander C. Berg, and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 157, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 105.74000000000001, "r_x1": 390.963, "r_y1": 105.74000000000001, "r_x2": 390.963, "r_y2": 98.043, "r_x3": 328.781, "r_y3": 98.043, "coord_origin": "TOPLEFT"}, "text": "Tamara L. Berg.", "orig": "Tamara L. Berg.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 158, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 400.27, "r_y0": 105.74000000000001, "r_x1": 435.14, "r_y1": 105.74000000000001, "r_x2": 435.14, "r_y2": 98.043, "r_x3": 400.27, "r_y3": 98.043, "coord_origin": "TOPLEFT"}, "text": "Babytalk:", "orig": "Babytalk:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 159, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 441.713, "r_y0": 105.74000000000001, "r_x1": 494.507, "r_y1": 105.74000000000001, "r_x2": 494.507, "r_y2": 98.043, "r_x3": 441.713, "r_y3": 98.043, "coord_origin": "TOPLEFT"}, "text": "Understanding", "orig": "Understanding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 160, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 498.649, "r_y0": 105.74000000000001, "r_x1": 545.113, "r_y1": 105.74000000000001, "r_x2": 545.113, "r_y2": 98.043, "r_x3": 498.649, "r_y3": 98.043, "coord_origin": "TOPLEFT"}, "text": "and generat-", "orig": "and generat-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 161, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 116.69899999999996, "r_x1": 440.807, "r_y1": 116.69899999999996, "r_x2": 440.807, "r_y2": 109.00199999999995, "r_x3": 328.781, "r_y3": 109.00199999999995, "coord_origin": "TOPLEFT"}, "text": "ing simple image descriptions.", "orig": "ing simple image descriptions.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 162, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 446.635, "r_y0": 116.57000000000005, "r_x1": 545.113, "r_y1": 116.57000000000005, "r_x2": 545.113, "r_y2": 108.84000000000003, "r_x3": 446.635, "r_y3": 108.84000000000003, "coord_origin": "TOPLEFT"}, "text": "IEEE Transactions on Pat-", "orig": "IEEE Transactions on Pat-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 163, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 127.529, "r_x1": 471.132, "r_y1": 127.529, "r_x2": 471.132, "r_y2": 119.79899999999998, "r_x3": 328.781, "r_y3": 119.79899999999998, "coord_origin": "TOPLEFT"}, "text": "tern Analysis and Machine Intelligence", "orig": "tern Analysis and Machine Intelligence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 164, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 471.133, "r_y0": 127.65800000000002, "r_x1": 473.375, "r_y1": 127.65800000000002, "r_x2": 473.375, "r_y2": 119.96100000000001, "r_x3": 471.133, "r_y3": 119.96100000000001, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 165, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 476.127, "r_y0": 127.65800000000002, "r_x1": 545.115, "r_y1": 127.65800000000002, "r_x2": 545.115, "r_y2": 119.96100000000001, "r_x3": 476.127, "r_y3": 119.96100000000001, "coord_origin": "TOPLEFT"}, "text": "35(12):2891-2903,", "orig": "35(12):2891-2903,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 166, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 138.61699999999996, "r_x1": 356.667, "r_y1": 138.61699999999996, "r_x2": 356.667, "r_y2": 130.91999999999996, "r_x3": 328.781, "r_y3": 130.91999999999996, "coord_origin": "TOPLEFT"}, "text": "2013. 4", "orig": "2013. 4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[16] Girish Kulkarni, Visruth Premraj, Vicente Ordonez, Sagnik Dhar, Siming Li, Yejin Choi, Alexander C. Berg, and Tamara L. Berg. Babytalk: Understanding and generating simple image descriptions. IEEE Transactions on Pattern Analysis and Machine Intelligence , 35(12):2891-2903, 2013. 4"}, {"label": "list_item", "id": 15, "page_no": 8, "cluster": {"id": 15, "label": "list_item", "bbox": {"l": 308.862, "t": 142.36599999999999, "r": 545.113, "b": 171.98000000000002, "coord_origin": "TOPLEFT"}, "confidence": 0.9253129959106445, "cells": [{"index": 167, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 150.063, "r_x1": 323.8, "r_y1": 150.063, "r_x2": 323.8, "r_y2": 142.36599999999999, "r_x3": 308.862, "r_y3": 142.36599999999999, "coord_origin": "TOPLEFT"}, "text": "[17]", "orig": "[17]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 168, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.785, "r_y0": 150.063, "r_x1": 375.698, "r_y1": 150.063, "r_x2": 375.698, "r_y2": 142.36599999999999, "r_x3": 328.785, "r_y3": 142.36599999999999, "coord_origin": "TOPLEFT"}, "text": "Minghao Li,", "orig": "Minghao Li,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 169, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 380.557, "r_y0": 150.063, "r_x1": 392.51, "r_y1": 150.063, "r_x2": 392.51, "r_y2": 142.36599999999999, "r_x3": 380.557, "r_y3": 142.36599999999999, "coord_origin": "TOPLEFT"}, "text": "Lei", "orig": "Lei", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 170, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 396.84, "r_y0": 150.063, "r_x1": 412.038, "r_y1": 150.063, "r_x2": 412.038, "r_y2": 142.36599999999999, "r_x3": 396.84, "r_y3": 142.36599999999999, "coord_origin": "TOPLEFT"}, "text": "Cui,", "orig": "Cui,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 171, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 416.889, "r_y0": 150.063, "r_x1": 478.246, "r_y1": 150.063, "r_x2": 478.246, "r_y2": 142.36599999999999, "r_x3": 416.889, "r_y3": 142.36599999999999, "coord_origin": "TOPLEFT"}, "text": "Shaohan Huang,", "orig": "Shaohan Huang,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 172, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 483.097, "r_y0": 150.063, "r_x1": 500.035, "r_y1": 150.063, "r_x2": 500.035, "r_y2": 142.36599999999999, "r_x3": 483.097, "r_y3": 142.36599999999999, "coord_origin": "TOPLEFT"}, "text": "Furu", "orig": "Furu", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 173, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 504.365, "r_y0": 150.063, "r_x1": 520.828, "r_y1": 150.063, "r_x2": 520.828, "r_y2": 142.36599999999999, "r_x3": 504.365, "r_y3": 142.36599999999999, "coord_origin": "TOPLEFT"}, "text": "Wei,", "orig": "Wei,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 174, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 525.679, "r_y0": 150.063, "r_x1": 545.109, "r_y1": 150.063, "r_x2": 545.109, "r_y2": 142.36599999999999, "r_x3": 525.679, "r_y3": 142.36599999999999, "coord_origin": "TOPLEFT"}, "text": "Ming", "orig": "Ming", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 175, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 161.02099999999996, "r_x1": 414.446, "r_y1": 161.02099999999996, "r_x2": 414.446, "r_y2": 153.32399999999996, "r_x3": 328.781, "r_y3": 153.32399999999996, "coord_origin": "TOPLEFT"}, "text": "Zhou, and Zhoujun Li.", "orig": "Zhou, and Zhoujun Li.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 176, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 421.825, "r_y0": 161.02099999999996, "r_x1": 461.448, "r_y1": 161.02099999999996, "r_x2": 461.448, "r_y2": 153.32399999999996, "r_x3": 421.825, "r_y3": 153.32399999999996, "coord_origin": "TOPLEFT"}, "text": "Tablebank:", "orig": "Tablebank:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 177, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 466.828, "r_y0": 161.02099999999996, "r_x1": 545.113, "r_y1": 161.02099999999996, "r_x2": 545.113, "r_y2": 153.32399999999996, "r_x3": 466.828, "r_y3": 153.32399999999996, "coord_origin": "TOPLEFT"}, "text": "A benchmark dataset", "orig": "A benchmark dataset", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 178, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 171.98000000000002, "r_x1": 493.628, "r_y1": 171.98000000000002, "r_x2": 493.628, "r_y2": 164.28300000000002, "r_x3": 328.781, "r_y3": 164.28300000000002, "coord_origin": "TOPLEFT"}, "text": "for table detection and recognition, 2019. 2, 3", "orig": "for table detection and recognition, 2019. 2, 3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[17] Minghao Li, Lei Cui, Shaohan Huang, Furu Wei, Ming Zhou, and Zhoujun Li. Tablebank: A benchmark dataset for table detection and recognition, 2019. 2, 3"}, {"label": "list_item", "id": 12, "page_no": 8, "cluster": {"id": 12, "label": "list_item", "bbox": {"l": 308.862, "t": 175.72900000000004, "r": 545.113, "b": 260.13800000000003, "coord_origin": "TOPLEFT"}, "confidence": 0.9299732446670532, "cells": [{"index": 179, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 183.42600000000004, "r_x1": 323.8, "r_y1": 183.42600000000004, "r_x2": 323.8, "r_y2": 175.72900000000004, "r_x3": 308.862, "r_y3": 175.72900000000004, "coord_origin": "TOPLEFT"}, "text": "[18]", "orig": "[18]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 180, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.785, "r_y0": 183.42600000000004, "r_x1": 545.109, "r_y1": 183.42600000000004, "r_x2": 545.109, "r_y2": 175.72900000000004, "r_x3": 328.785, "r_y3": 175.72900000000004, "coord_origin": "TOPLEFT"}, "text": "Yiren Li, Zheng Huang, Junchi Yan, Yi Zhou, Fan Ye, and", "orig": "Yiren Li, Zheng Huang, Junchi Yan, Yi Zhou, Fan Ye, and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 181, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 194.385, "r_x1": 375.397, "r_y1": 194.385, "r_x2": 375.397, "r_y2": 186.688, "r_x3": 328.781, "r_y3": 186.688, "coord_origin": "TOPLEFT"}, "text": "Xianhui Liu.", "orig": "Xianhui Liu.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 182, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 381.154, "r_y0": 194.385, "r_x1": 399.58, "r_y1": 194.385, "r_x2": 399.58, "r_y2": 186.688, "r_x3": 381.154, "r_y3": 186.688, "coord_origin": "TOPLEFT"}, "text": "Gfte:", "orig": "Gfte:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 183, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 403.937, "r_y0": 194.385, "r_x1": 545.113, "r_y1": 194.385, "r_x2": 545.113, "r_y2": 186.688, "r_x3": 403.937, "r_y3": 186.688, "coord_origin": "TOPLEFT"}, "text": "Graph-based financial table extraction.", "orig": "Graph-based financial table extraction.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 184, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 205.34400000000005, "r_x1": 545.113, "r_y1": 205.34400000000005, "r_x2": 545.113, "r_y2": 197.64700000000005, "r_x3": 328.781, "r_y3": 197.64700000000005, "coord_origin": "TOPLEFT"}, "text": "In Alberto Del Bimbo, Rita Cucchiara, Stan Sclaroff, Gio-", "orig": "In Alberto Del Bimbo, Rita Cucchiara, Stan Sclaroff, Gio-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 185, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 216.303, "r_x1": 545.113, "r_y1": 216.303, "r_x2": 545.113, "r_y2": 208.606, "r_x3": 328.781, "r_y3": 208.606, "coord_origin": "TOPLEFT"}, "text": "vanni Maria Farinella, Tao Mei, Marco Bertini, Hugo Jair", "orig": "vanni Maria Farinella, Tao Mei, Marco Bertini, Hugo Jair", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 186, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 227.26199999999994, "r_x1": 365.382, "r_y1": 227.26199999999994, "r_x2": 365.382, "r_y2": 219.56500000000005, "r_x3": 328.781, "r_y3": 219.56500000000005, "coord_origin": "TOPLEFT"}, "text": "Escalante,", "orig": "Escalante,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 187, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 369.237, "r_y0": 227.26199999999994, "r_x1": 479.264, "r_y1": 227.26199999999994, "r_x2": 479.264, "r_y2": 219.56500000000005, "r_x3": 369.237, "r_y3": 219.56500000000005, "coord_origin": "TOPLEFT"}, "text": "and Roberto Vezzani, editors,", "orig": "and Roberto Vezzani, editors,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 188, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 483.119, "r_y0": 227.13300000000004, "r_x1": 545.113, "r_y1": 227.13300000000004, "r_x2": 545.113, "r_y2": 219.40300000000002, "r_x3": 483.119, "r_y3": 219.40300000000002, "coord_origin": "TOPLEFT"}, "text": "Pattern Recogni-", "orig": "Pattern Recogni-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 189, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 238.091, "r_x1": 519.398, "r_y1": 238.091, "r_x2": 519.398, "r_y2": 230.361, "r_x3": 328.781, "r_y3": 230.361, "coord_origin": "TOPLEFT"}, "text": "tion. ICPR International Workshops and Challenges", "orig": "tion. ICPR International Workshops and Challenges", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 190, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 519.401, "r_y0": 238.22000000000003, "r_x1": 521.643, "r_y1": 238.22000000000003, "r_x2": 521.643, "r_y2": 230.52300000000002, "r_x3": 519.401, "r_y3": 230.52300000000002, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 191, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 524.691, "r_y0": 238.22000000000003, "r_x1": 545.108, "r_y1": 238.22000000000003, "r_x2": 545.108, "r_y2": 230.52300000000002, "r_x3": 524.691, "r_y3": 230.52300000000002, "coord_origin": "TOPLEFT"}, "text": "pages", "orig": "pages", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 192, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 249.17899999999997, "r_x1": 545.113, "r_y1": 249.17899999999997, "r_x2": 545.113, "r_y2": 241.48199999999997, "r_x3": 328.781, "r_y3": 241.48199999999997, "coord_origin": "TOPLEFT"}, "text": "644-658, Cham, 2021. Springer International Publishing. 2,", "orig": "644-658, Cham, 2021. Springer International Publishing. 2,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 193, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 260.13800000000003, "r_x1": 333.264, "r_y1": 260.13800000000003, "r_x2": 333.264, "r_y2": 252.44100000000003, "r_x3": 328.781, "r_y3": 252.44100000000003, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[18] Yiren Li, Zheng Huang, Junchi Yan, Yi Zhou, Fan Ye, and Xianhui Liu. Gfte: Graph-based financial table extraction. In Alberto Del Bimbo, Rita Cucchiara, Stan Sclaroff, Giovanni Maria Farinella, Tao Mei, Marco Bertini, Hugo Jair Escalante, and Roberto Vezzani, editors, Pattern Recognition. ICPR International Workshops and Challenges , pages 644-658, Cham, 2021. Springer International Publishing. 2, 3"}, {"label": "list_item", "id": 8, "page_no": 8, "cluster": {"id": 8, "label": "list_item", "bbox": {"l": 308.862, "t": 263.88699999999994, "r": 545.114, "b": 326.378, "coord_origin": "TOPLEFT"}, "confidence": 0.937321662902832, "cells": [{"index": 194, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 271.58399999999995, "r_x1": 323.8, "r_y1": 271.58399999999995, "r_x2": 323.8, "r_y2": 263.88699999999994, "r_x3": 308.862, "r_y3": 263.88699999999994, "coord_origin": "TOPLEFT"}, "text": "[19]", "orig": "[19]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 195, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.785, "r_y0": 271.58399999999995, "r_x1": 545.109, "r_y1": 271.58399999999995, "r_x2": 545.109, "r_y2": 263.88699999999994, "r_x3": 328.785, "r_y3": 263.88699999999994, "coord_origin": "TOPLEFT"}, "text": "Nikolaos Livathinos, Cesar Berrospi, Maksym Lysak, Vik-", "orig": "Nikolaos Livathinos, Cesar Berrospi, Maksym Lysak, Vik-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 196, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 282.543, "r_x1": 545.113, "r_y1": 282.543, "r_x2": 545.113, "r_y2": 274.846, "r_x3": 328.781, "r_y3": 274.846, "coord_origin": "TOPLEFT"}, "text": "tor Kuropiatnyk, Ahmed Nassar, Andre Carvalho, Michele", "orig": "tor Kuropiatnyk, Ahmed Nassar, Andre Carvalho, Michele", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 197, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 293.502, "r_x1": 527.118, "r_y1": 293.502, "r_x2": 527.118, "r_y2": 285.805, "r_x3": 328.781, "r_y3": 285.805, "coord_origin": "TOPLEFT"}, "text": "Dolfi, Christoph Auer, Kasper Dinkla, and Peter Staar.", "orig": "Dolfi, Christoph Auer, Kasper Dinkla, and Peter Staar.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 198, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 531.664, "r_y0": 293.502, "r_x1": 545.113, "r_y1": 293.502, "r_x2": 545.113, "r_y2": 285.805, "r_x3": 531.664, "r_y3": 285.805, "coord_origin": "TOPLEFT"}, "text": "Ro-", "orig": "Ro-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 199, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 304.461, "r_x1": 343.549, "r_y1": 304.461, "r_x2": 343.549, "r_y2": 296.764, "r_x3": 328.781, "r_y3": 296.764, "coord_origin": "TOPLEFT"}, "text": "bust", "orig": "bust", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 200, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 347.44, "r_y0": 304.461, "r_x1": 545.113, "r_y1": 304.461, "r_x2": 545.113, "r_y2": 296.764, "r_x3": 347.44, "r_y3": 296.764, "coord_origin": "TOPLEFT"}, "text": "pdf document conversion using recurrent neural net-", "orig": "pdf document conversion using recurrent neural net-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 201, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 315.419, "r_x1": 352.847, "r_y1": 315.419, "r_x2": 352.847, "r_y2": 307.722, "r_x3": 328.781, "r_y3": 307.722, "coord_origin": "TOPLEFT"}, "text": "works.", "orig": "works.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 202, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 360.236, "r_y0": 315.29, "r_x1": 545.114, "r_y1": 315.29, "r_x2": 545.114, "r_y2": 307.56, "r_x3": 360.236, "r_y3": 307.56, "coord_origin": "TOPLEFT"}, "text": "Proceedings of the AAAI Conference on Artificial", "orig": "Proceedings of the AAAI Conference on Artificial", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 203, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 326.249, "r_x1": 371.022, "r_y1": 326.249, "r_x2": 371.022, "r_y2": 318.519, "r_x3": 328.781, "r_y3": 318.519, "coord_origin": "TOPLEFT"}, "text": "Intelligence", "orig": "Intelligence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 204, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 371.021, "r_y0": 326.378, "r_x1": 502.262, "r_y1": 326.378, "r_x2": 502.262, "r_y2": 318.681, "r_x3": 371.021, "r_y3": 318.681, "coord_origin": "TOPLEFT"}, "text": ", 35(17):15137-15145, May 2021. 1", "orig": ", 35(17):15137-15145, May 2021. 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[19] Nikolaos Livathinos, Cesar Berrospi, Maksym Lysak, Viktor Kuropiatnyk, Ahmed Nassar, Andre Carvalho, Michele Dolfi, Christoph Auer, Kasper Dinkla, and Peter Staar. Robust pdf document conversion using recurrent neural networks. Proceedings of the AAAI Conference on Artificial Intelligence , 35(17):15137-15145, May 2021. 1"}, {"label": "list_item", "id": 18, "page_no": 8, "cluster": {"id": 18, "label": "list_item", "bbox": {"l": 308.862, "t": 330.127, "r": 545.116, "b": 370.701, "coord_origin": "TOPLEFT"}, "confidence": 0.9027292728424072, "cells": [{"index": 205, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 337.824, "r_x1": 323.8, "r_y1": 337.824, "r_x2": 323.8, "r_y2": 330.127, "r_x3": 308.862, "r_y3": 330.127, "coord_origin": "TOPLEFT"}, "text": "[20]", "orig": "[20]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 206, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.785, "r_y0": 337.824, "r_x1": 545.109, "r_y1": 337.824, "r_x2": 545.109, "r_y2": 330.127, "r_x3": 328.785, "r_y3": 330.127, "coord_origin": "TOPLEFT"}, "text": "Rujiao Long, Wen Wang, Nan Xue, Feiyu Gao, Zhibo Yang,", "orig": "Rujiao Long, Wen Wang, Nan Xue, Feiyu Gao, Zhibo Yang,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 207, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 348.783, "r_x1": 456.821, "r_y1": 348.783, "r_x2": 456.821, "r_y2": 341.086, "r_x3": 328.781, "r_y3": 341.086, "coord_origin": "TOPLEFT"}, "text": "Yongpan Wang, and Gui-Song Xia.", "orig": "Yongpan Wang, and Gui-Song Xia.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 208, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 460.991, "r_y0": 348.783, "r_x1": 545.113, "r_y1": 348.783, "r_x2": 545.113, "r_y2": 341.086, "r_x3": 460.991, "r_y3": 341.086, "coord_origin": "TOPLEFT"}, "text": "Parsing table structures", "orig": "Parsing table structures", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 209, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 359.742, "r_x1": 370.421, "r_y1": 359.742, "r_x2": 370.421, "r_y2": 352.045, "r_x3": 328.781, "r_y3": 352.045, "coord_origin": "TOPLEFT"}, "text": "in the wild.", "orig": "in the wild.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 210, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 375.308, "r_y0": 359.742, "r_x1": 382.777, "r_y1": 359.742, "r_x2": 382.777, "r_y2": 352.045, "r_x3": 375.308, "r_y3": 352.045, "coord_origin": "TOPLEFT"}, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 211, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 385.541, "r_y0": 359.613, "r_x1": 545.116, "r_y1": 359.613, "r_x2": 545.116, "r_y2": 351.883, "r_x3": 385.541, "r_y3": 351.883, "coord_origin": "TOPLEFT"}, "text": "Proceedings of the IEEE/CVF International", "orig": "Proceedings of the IEEE/CVF International", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 212, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 370.572, "r_x1": 443.596, "r_y1": 370.572, "r_x2": 443.596, "r_y2": 362.842, "r_x3": 328.781, "r_y3": 362.842, "coord_origin": "TOPLEFT"}, "text": "Conference on Computer Vision", "orig": "Conference on Computer Vision", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 213, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 443.594, "r_y0": 370.701, "r_x1": 534.486, "r_y1": 370.701, "r_x2": 534.486, "r_y2": 363.004, "r_x3": 443.594, "r_y3": 363.004, "coord_origin": "TOPLEFT"}, "text": ", pages 944-952, 2021. 2", "orig": ", pages 944-952, 2021. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[20] Rujiao Long, Wen Wang, Nan Xue, Feiyu Gao, Zhibo Yang, Yongpan Wang, and Gui-Song Xia. Parsing table structures in the wild. In Proceedings of the IEEE/CVF International Conference on Computer Vision , pages 944-952, 2021. 2"}, {"label": "list_item", "id": 21, "page_no": 8, "cluster": {"id": 21, "label": "list_item", "bbox": {"l": 308.862, "t": 374.449, "r": 545.113, "b": 436.941, "coord_origin": "TOPLEFT"}, "confidence": 0.882714569568634, "cells": [{"index": 214, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 382.146, "r_x1": 323.8, "r_y1": 382.146, "r_x2": 323.8, "r_y2": 374.449, "r_x3": 308.862, "r_y3": 374.449, "coord_origin": "TOPLEFT"}, "text": "[21]", "orig": "[21]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 215, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.785, "r_y0": 382.146, "r_x1": 362.66, "r_y1": 382.146, "r_x2": 362.66, "r_y2": 374.449, "r_x3": 328.785, "r_y3": 374.449, "coord_origin": "TOPLEFT"}, "text": "Shubham", "orig": "Shubham", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 216, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 368.695, "r_y0": 382.146, "r_x1": 389.613, "r_y1": 382.146, "r_x2": 389.613, "r_y2": 374.449, "r_x3": 368.695, "r_y3": 374.449, "coord_origin": "TOPLEFT"}, "text": "Singh", "orig": "Singh", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 217, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 395.648, "r_y0": 382.146, "r_x1": 424.564, "r_y1": 382.146, "r_x2": 424.564, "r_y2": 374.449, "r_x3": 395.648, "r_y3": 374.449, "coord_origin": "TOPLEFT"}, "text": "Paliwal,", "orig": "Paliwal,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 218, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 431.549, "r_y0": 382.146, "r_x1": 488.504, "r_y1": 382.146, "r_x2": 488.504, "r_y2": 374.449, "r_x3": 431.549, "r_y3": 374.449, "coord_origin": "TOPLEFT"}, "text": "D Vishwanath,", "orig": "D Vishwanath,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 219, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 495.48, "r_y0": 382.146, "r_x1": 515.412, "r_y1": 382.146, "r_x2": 515.412, "r_y2": 374.449, "r_x3": 495.48, "r_y3": 374.449, "coord_origin": "TOPLEFT"}, "text": "Rohit", "orig": "Rohit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 220, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 521.446, "r_y0": 382.146, "r_x1": 545.109, "r_y1": 382.146, "r_x2": 545.109, "r_y2": 374.449, "r_x3": 521.446, "r_y3": 374.449, "coord_origin": "TOPLEFT"}, "text": "Rahul,", "orig": "Rahul,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 221, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 393.105, "r_x1": 460.318, "r_y1": 393.105, "r_x2": 460.318, "r_y2": 385.408, "r_x3": 328.781, "r_y3": 385.408, "coord_origin": "TOPLEFT"}, "text": "Monika Sharma, and Lovekesh Vig.", "orig": "Monika Sharma, and Lovekesh Vig.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 222, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 465.393, "r_y0": 393.105, "r_x1": 498.542, "r_y1": 393.105, "r_x2": 498.542, "r_y2": 385.408, "r_x3": 465.393, "r_y3": 385.408, "coord_origin": "TOPLEFT"}, "text": "Tablenet:", "orig": "Tablenet:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 223, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 502.469, "r_y0": 393.105, "r_x1": 545.113, "r_y1": 393.105, "r_x2": 545.113, "r_y2": 385.408, "r_x3": 502.469, "r_y3": 385.408, "coord_origin": "TOPLEFT"}, "text": "Deep learn-", "orig": "Deep learn-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 224, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 404.064, "r_x1": 545.113, "r_y1": 404.064, "r_x2": 545.113, "r_y2": 396.367, "r_x3": 328.781, "r_y3": 396.367, "coord_origin": "TOPLEFT"}, "text": "ing model for end-to-end table detection and tabular data ex-", "orig": "ing model for end-to-end table detection and tabular data ex-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 225, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 415.023, "r_x1": 478.009, "r_y1": 415.023, "r_x2": 478.009, "r_y2": 407.326, "r_x3": 328.781, "r_y3": 407.326, "coord_origin": "TOPLEFT"}, "text": "traction from scanned document images.", "orig": "traction from scanned document images.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 226, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 484.07, "r_y0": 415.023, "r_x1": 491.539, "r_y1": 415.023, "r_x2": 491.539, "r_y2": 407.326, "r_x3": 484.07, "r_y3": 407.326, "coord_origin": "TOPLEFT"}, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 227, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 494.668, "r_y0": 414.894, "r_x1": 545.113, "r_y1": 414.894, "r_x2": 545.113, "r_y2": 407.164, "r_x3": 494.668, "r_y3": 407.164, "coord_origin": "TOPLEFT"}, "text": "2019 Interna-", "orig": "2019 Interna-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 228, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 425.853, "r_x1": 349.709, "r_y1": 425.853, "r_x2": 349.709, "r_y2": 418.123, "r_x3": 328.781, "r_y3": 418.123, "coord_origin": "TOPLEFT"}, "text": "tional", "orig": "tional", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 229, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 353.295, "r_y0": 425.853, "r_x1": 545.113, "r_y1": 425.853, "r_x2": 545.113, "r_y2": 418.123, "r_x3": 353.295, "r_y3": 418.123, "coord_origin": "TOPLEFT"}, "text": "Conference on Document Analysis and Recognition", "orig": "Conference on Document Analysis and Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 230, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 436.812, "r_x1": 360.836, "r_y1": 436.812, "r_x2": 360.836, "r_y2": 429.082, "r_x3": 328.781, "r_y3": 429.082, "coord_origin": "TOPLEFT"}, "text": "(ICDAR)", "orig": "(ICDAR)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 231, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 360.836, "r_y0": 436.941, "r_x1": 475.633, "r_y1": 436.941, "r_x2": 475.633, "r_y2": 429.244, "r_x3": 360.836, "r_y3": 429.244, "coord_origin": "TOPLEFT"}, "text": ", pages 128-133. IEEE, 2019. 1", "orig": ", pages 128-133. IEEE, 2019. 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[21] Shubham Singh Paliwal, D Vishwanath, Rohit Rahul, Monika Sharma, and Lovekesh Vig. Tablenet: Deep learning model for end-to-end table detection and tabular data extraction from scanned document images. In 2019 International Conference on Document Analysis and Recognition (ICDAR) , pages 128-133. IEEE, 2019. 1"}, {"label": "list_item", "id": 20, "page_no": 8, "cluster": {"id": 20, "label": "list_item", "bbox": {"l": 308.862, "t": 440.689, "r": 545.115, "b": 557.975, "coord_origin": "TOPLEFT"}, "confidence": 0.8896440863609314, "cells": [{"index": 232, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 448.386, "r_x1": 323.8, "r_y1": 448.386, "r_x2": 323.8, "r_y2": 440.689, "r_x3": 308.862, "r_y3": 440.689, "coord_origin": "TOPLEFT"}, "text": "[22]", "orig": "[22]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 233, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.785, "r_y0": 448.386, "r_x1": 545.109, "r_y1": 448.386, "r_x2": 545.109, "r_y2": 440.689, "r_x3": 328.785, "r_y3": 440.689, "coord_origin": "TOPLEFT"}, "text": "Adam Paszke, Sam Gross, Francisco Massa, Adam Lerer,", "orig": "Adam Paszke, Sam Gross, Francisco Massa, Adam Lerer,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 234, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 459.345, "r_x1": 545.113, "r_y1": 459.345, "r_x2": 545.113, "r_y2": 451.648, "r_x3": 328.781, "r_y3": 451.648, "coord_origin": "TOPLEFT"}, "text": "James Bradbury, Gregory Chanan, Trevor Killeen, Zeming", "orig": "James Bradbury, Gregory Chanan, Trevor Killeen, Zeming", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 235, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 470.304, "r_x1": 343.477, "r_y1": 470.304, "r_x2": 343.477, "r_y2": 462.607, "r_x3": 328.781, "r_y3": 462.607, "coord_origin": "TOPLEFT"}, "text": "Lin,", "orig": "Lin,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 236, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 347.601, "r_y0": 470.304, "r_x1": 373.496, "r_y1": 470.304, "r_x2": 373.496, "r_y2": 462.607, "r_x3": 347.601, "r_y3": 462.607, "coord_origin": "TOPLEFT"}, "text": "Natalia", "orig": "Natalia", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 237, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 377.244, "r_y0": 470.304, "r_x1": 420.83, "r_y1": 470.304, "r_x2": 420.83, "r_y2": 462.607, "r_x3": 377.244, "r_y3": 462.607, "coord_origin": "TOPLEFT"}, "text": "Gimelshein,", "orig": "Gimelshein,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 238, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 424.955, "r_y0": 470.304, "r_x1": 473.239, "r_y1": 470.304, "r_x2": 473.239, "r_y2": 462.607, "r_x3": 424.955, "r_y3": 462.607, "coord_origin": "TOPLEFT"}, "text": "Luca Antiga,", "orig": "Luca Antiga,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 239, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 477.363, "r_y0": 470.304, "r_x1": 545.113, "r_y1": 470.304, "r_x2": 545.113, "r_y2": 462.607, "r_x3": 477.363, "r_y3": 462.607, "coord_origin": "TOPLEFT"}, "text": "Alban Desmaison,", "orig": "Alban Desmaison,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 240, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 481.263, "r_x1": 545.113, "r_y1": 481.263, "r_x2": 545.113, "r_y2": 473.566, "r_x3": 328.781, "r_y3": 473.566, "coord_origin": "TOPLEFT"}, "text": "Andreas Kopf, Edward Yang, Zachary DeVito, Martin Rai-", "orig": "Andreas Kopf, Edward Yang, Zachary DeVito, Martin Rai-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 241, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 492.222, "r_x1": 545.113, "r_y1": 492.222, "r_x2": 545.113, "r_y2": 484.525, "r_x3": 328.781, "r_y3": 484.525, "coord_origin": "TOPLEFT"}, "text": "son, Alykhan Tejani, Sasank Chilamkurthy, Benoit Steiner,", "orig": "son, Alykhan Tejani, Sasank Chilamkurthy, Benoit Steiner,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 242, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 503.181, "r_x1": 545.113, "r_y1": 503.181, "r_x2": 545.113, "r_y2": 495.484, "r_x3": 328.781, "r_y3": 495.484, "coord_origin": "TOPLEFT"}, "text": "Lu Fang, Junjie Bai, and Soumith Chintala. Pytorch: An im-", "orig": "Lu Fang, Junjie Bai, and Soumith Chintala. Pytorch: An im-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 243, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 514.14, "r_x1": 545.113, "r_y1": 514.14, "r_x2": 545.113, "r_y2": 506.443, "r_x3": 328.781, "r_y3": 506.443, "coord_origin": "TOPLEFT"}, "text": "perative style, high-performance deep learning library. In H.", "orig": "perative style, high-performance deep learning library. In H.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 244, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 525.0989999999999, "r_x1": 545.11, "r_y1": 525.0989999999999, "r_x2": 545.11, "r_y2": 517.402, "r_x3": 328.781, "r_y3": 517.402, "coord_origin": "TOPLEFT"}, "text": "Wallach, H. Larochelle, A. Beygelzimer, F. d'Alch\u00b4-Buc, E.", "orig": "Wallach, H. Larochelle, A. Beygelzimer, F. d'Alch\u00b4-Buc, E.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 245, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 511.145, "r_y0": 525.0989999999999, "r_x1": 515.126, "r_y1": 525.0989999999999, "r_x2": 515.126, "r_y2": 517.402, "r_x3": 511.145, "r_y3": 517.402, "coord_origin": "TOPLEFT"}, "text": "e", "orig": "e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 246, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 536.057, "r_x1": 434.567, "r_y1": 536.057, "r_x2": 434.567, "r_y2": 528.36, "r_x3": 328.781, "r_y3": 528.36, "coord_origin": "TOPLEFT"}, "text": "Fox, and R. Garnett, editors,", "orig": "Fox, and R. Garnett, editors,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 247, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 437.864, "r_y0": 535.928, "r_x1": 545.111, "r_y1": 535.928, "r_x2": 545.111, "r_y2": 528.198, "r_x3": 437.864, "r_y3": 528.198, "coord_origin": "TOPLEFT"}, "text": "Advances in Neural Informa-", "orig": "Advances in Neural Informa-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 248, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 546.887, "r_x1": 425.735, "r_y1": 546.887, "r_x2": 425.735, "r_y2": 539.157, "r_x3": 328.781, "r_y3": 539.157, "coord_origin": "TOPLEFT"}, "text": "tion Processing Systems 32", "orig": "tion Processing Systems 32", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 249, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 425.736, "r_y0": 547.016, "r_x1": 545.115, "r_y1": 547.016, "r_x2": 545.115, "r_y2": 539.319, "r_x3": 425.736, "r_y3": 539.319, "coord_origin": "TOPLEFT"}, "text": ", pages 8024-8035. Curran Asso-", "orig": ", pages 8024-8035. Curran Asso-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 250, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 557.975, "r_x1": 399.741, "r_y1": 557.975, "r_x2": 399.741, "r_y2": 550.278, "r_x3": 328.781, "r_y3": 550.278, "coord_origin": "TOPLEFT"}, "text": "ciates, Inc., 2019. 6", "orig": "ciates, Inc., 2019. 6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[22] Adam Paszke, Sam Gross, Francisco Massa, Adam Lerer, James Bradbury, Gregory Chanan, Trevor Killeen, Zeming Lin, Natalia Gimelshein, Luca Antiga, Alban Desmaison, Andreas Kopf, Edward Yang, Zachary DeVito, Martin Raison, Alykhan Tejani, Sasank Chilamkurthy, Benoit Steiner, Lu Fang, Junjie Bai, and Soumith Chintala. Pytorch: An imperative style, high-performance deep learning library. In H. Wallach, H. Larochelle, A. Beygelzimer, F. d'Alch\u00b4-Buc, E. e Fox, and R. Garnett, editors, Advances in Neural Information Processing Systems 32 , pages 8024-8035. Curran Associates, Inc., 2019. 6"}, {"label": "list_item", "id": 19, "page_no": 8, "cluster": {"id": 19, "label": "list_item", "bbox": {"l": 308.862, "t": 561.7239999999999, "r": 545.113, "b": 624.215, "coord_origin": "TOPLEFT"}, "confidence": 0.9025435447692871, "cells": [{"index": 251, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 569.421, "r_x1": 323.8, "r_y1": 569.421, "r_x2": 323.8, "r_y2": 561.7239999999999, "r_x3": 308.862, "r_y3": 561.7239999999999, "coord_origin": "TOPLEFT"}, "text": "[23]", "orig": "[23]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 252, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.785, "r_y0": 569.421, "r_x1": 395.433, "r_y1": 569.421, "r_x2": 395.433, "r_y2": 561.7239999999999, "r_x3": 328.785, "r_y3": 561.7239999999999, "coord_origin": "TOPLEFT"}, "text": "Devashish Prasad,", "orig": "Devashish Prasad,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 253, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 399.369, "r_y0": 569.421, "r_x1": 545.109, "r_y1": 569.421, "r_x2": 545.109, "r_y2": 561.7239999999999, "r_x3": 399.369, "r_y3": 561.7239999999999, "coord_origin": "TOPLEFT"}, "text": "Ayan Gadpal, Kshitij Kapadni, Manish", "orig": "Ayan Gadpal, Kshitij Kapadni, Manish", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 254, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 580.38, "r_x1": 545.113, "r_y1": 580.38, "r_x2": 545.113, "r_y2": 572.683, "r_x3": 328.781, "r_y3": 572.683, "coord_origin": "TOPLEFT"}, "text": "Visave, and Kavita Sultanpure. Cascadetabnet: An approach", "orig": "Visave, and Kavita Sultanpure. Cascadetabnet: An approach", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 255, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 591.3389999999999, "r_x1": 545.113, "r_y1": 591.3389999999999, "r_x2": 545.113, "r_y2": 583.642, "r_x3": 328.781, "r_y3": 583.642, "coord_origin": "TOPLEFT"}, "text": "for end to end table detection and structure recognition from", "orig": "for end to end table detection and structure recognition from", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 256, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 602.298, "r_x1": 418.266, "r_y1": 602.298, "r_x2": 418.266, "r_y2": 594.601, "r_x3": 328.781, "r_y3": 594.601, "coord_origin": "TOPLEFT"}, "text": "image-based documents.", "orig": "image-based documents.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 257, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 424.148, "r_y0": 602.298, "r_x1": 431.617, "r_y1": 602.298, "r_x2": 431.617, "r_y2": 594.601, "r_x3": 424.148, "r_y3": 594.601, "coord_origin": "TOPLEFT"}, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 258, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 434.691, "r_y0": 602.169, "r_x1": 545.112, "r_y1": 602.169, "r_x2": 545.112, "r_y2": 594.439, "r_x3": 434.691, "r_y3": 594.439, "coord_origin": "TOPLEFT"}, "text": "Proceedings of the IEEE/CVF", "orig": "Proceedings of the IEEE/CVF", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 259, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 613.127, "r_x1": 369.784, "r_y1": 613.127, "r_x2": 369.784, "r_y2": 605.3969999999999, "r_x3": 328.781, "r_y3": 605.3969999999999, "coord_origin": "TOPLEFT"}, "text": "Conference", "orig": "Conference", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 260, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 374.008, "r_y0": 613.127, "r_x1": 449.549, "r_y1": 613.127, "r_x2": 449.549, "r_y2": 605.3969999999999, "r_x3": 374.008, "r_y3": 605.3969999999999, "coord_origin": "TOPLEFT"}, "text": "on Computer Vision", "orig": "on Computer Vision", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 261, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 453.782, "r_y0": 613.127, "r_x1": 497.636, "r_y1": 613.127, "r_x2": 497.636, "r_y2": 605.3969999999999, "r_x3": 453.782, "r_y3": 605.3969999999999, "coord_origin": "TOPLEFT"}, "text": "and Pattern", "orig": "and Pattern", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 262, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 501.868, "r_y0": 613.127, "r_x1": 545.113, "r_y1": 613.127, "r_x2": 545.113, "r_y2": 605.3969999999999, "r_x3": 501.868, "r_y3": 605.3969999999999, "coord_origin": "TOPLEFT"}, "text": "Recognition", "orig": "Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 263, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 624.086, "r_x1": 367.803, "r_y1": 624.086, "r_x2": 367.803, "r_y2": 616.356, "r_x3": 328.781, "r_y3": 616.356, "coord_origin": "TOPLEFT"}, "text": "Workshops", "orig": "Workshops", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 264, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 367.802, "r_y0": 624.215, "r_x1": 458.694, "r_y1": 624.215, "r_x2": 458.694, "r_y2": 616.518, "r_x3": 367.802, "r_y3": 616.518, "coord_origin": "TOPLEFT"}, "text": ", pages 572-573, 2020. 1", "orig": ", pages 572-573, 2020. 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[23] Devashish Prasad, Ayan Gadpal, Kshitij Kapadni, Manish Visave, and Kavita Sultanpure. Cascadetabnet: An approach for end to end table detection and structure recognition from image-based documents. In Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition Workshops , pages 572-573, 2020. 1"}, {"label": "list_item", "id": 23, "page_no": 8, "cluster": {"id": 23, "label": "list_item", "bbox": {"l": 308.862, "t": 627.9639999999999, "r": 545.116, "b": 668.538, "coord_origin": "TOPLEFT"}, "confidence": 0.8777532577514648, "cells": [{"index": 265, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 635.6610000000001, "r_x1": 323.8, "r_y1": 635.6610000000001, "r_x2": 323.8, "r_y2": 627.9639999999999, "r_x3": 308.862, "r_y3": 627.9639999999999, "coord_origin": "TOPLEFT"}, "text": "[24]", "orig": "[24]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 266, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.785, "r_y0": 635.6610000000001, "r_x1": 545.109, "r_y1": 635.6610000000001, "r_x2": 545.109, "r_y2": 627.9639999999999, "r_x3": 328.785, "r_y3": 627.9639999999999, "coord_origin": "TOPLEFT"}, "text": "Shah Rukh Qasim, Hassan Mahmood, and Faisal Shafait.", "orig": "Shah Rukh Qasim, Hassan Mahmood, and Faisal Shafait.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 267, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 646.62, "r_x1": 545.113, "r_y1": 646.62, "r_x2": 545.113, "r_y2": 638.923, "r_x3": 328.781, "r_y3": 638.923, "coord_origin": "TOPLEFT"}, "text": "Rethinking table recognition using graph neural networks.", "orig": "Rethinking table recognition using graph neural networks.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 268, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 657.579, "r_x1": 336.25, "r_y1": 657.579, "r_x2": 336.25, "r_y2": 649.8820000000001, "r_x3": 328.781, "r_y3": 649.8820000000001, "coord_origin": "TOPLEFT"}, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 269, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 338.1, "r_y0": 657.45, "r_x1": 545.116, "r_y1": 657.45, "r_x2": 545.116, "r_y2": 649.72, "r_x3": 338.1, "r_y3": 649.72, "coord_origin": "TOPLEFT"}, "text": "2019 International Conference on Document Analysis and", "orig": "2019 International Conference on Document Analysis and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 270, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 668.409, "r_x1": 406.322, "r_y1": 668.409, "r_x2": 406.322, "r_y2": 660.679, "r_x3": 328.781, "r_y3": 660.679, "coord_origin": "TOPLEFT"}, "text": "Recognition (ICDAR)", "orig": "Recognition (ICDAR)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 271, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 406.322, "r_y0": 668.538, "r_x1": 521.119, "r_y1": 668.538, "r_x2": 521.119, "r_y2": 660.841, "r_x3": 406.322, "r_y3": 660.841, "coord_origin": "TOPLEFT"}, "text": ", pages 142-147. IEEE, 2019. 3", "orig": ", pages 142-147. IEEE, 2019. 3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[24] Shah Rukh Qasim, Hassan Mahmood, and Faisal Shafait. Rethinking table recognition using graph neural networks. In 2019 International Conference on Document Analysis and Recognition (ICDAR) , pages 142-147. IEEE, 2019. 3"}, {"label": "list_item", "id": 24, "page_no": 8, "cluster": {"id": 24, "label": "list_item", "bbox": {"l": 308.862, "t": 672.2860000000001, "r": 545.113, "b": 712.86, "coord_origin": "TOPLEFT"}, "confidence": 0.8654531240463257, "cells": [{"index": 272, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 679.983, "r_x1": 323.8, "r_y1": 679.983, "r_x2": 323.8, "r_y2": 672.2860000000001, "r_x3": 308.862, "r_y3": 672.2860000000001, "coord_origin": "TOPLEFT"}, "text": "[25]", "orig": "[25]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 273, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.785, "r_y0": 679.983, "r_x1": 400.857, "r_y1": 679.983, "r_x2": 400.857, "r_y2": 672.2860000000001, "r_x3": 328.785, "r_y3": 672.2860000000001, "coord_origin": "TOPLEFT"}, "text": "Hamid Rezatofighi,", "orig": "Hamid Rezatofighi,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 274, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 405.403, "r_y0": 679.983, "r_x1": 453.571, "r_y1": 679.983, "r_x2": 453.571, "r_y2": 672.2860000000001, "r_x3": 405.403, "r_y3": 672.2860000000001, "coord_origin": "TOPLEFT"}, "text": "Nathan Tsoi,", "orig": "Nathan Tsoi,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 275, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 458.117, "r_y0": 679.983, "r_x1": 521.635, "r_y1": 679.983, "r_x2": 521.635, "r_y2": 672.2860000000001, "r_x3": 458.117, "r_y3": 672.2860000000001, "coord_origin": "TOPLEFT"}, "text": "JunYoung Gwak,", "orig": "JunYoung Gwak,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 276, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 526.181, "r_y0": 679.983, "r_x1": 545.109, "r_y1": 679.983, "r_x2": 545.109, "r_y2": 672.2860000000001, "r_x3": 526.181, "r_y3": 672.2860000000001, "coord_origin": "TOPLEFT"}, "text": "Amir", "orig": "Amir", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 277, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 690.942, "r_x1": 482.815, "r_y1": 690.942, "r_x2": 482.815, "r_y2": 683.245, "r_x3": 328.781, "r_y3": 683.245, "coord_origin": "TOPLEFT"}, "text": "Sadeghian, Ian Reid, and Silvio Savarese.", "orig": "Sadeghian, Ian Reid, and Silvio Savarese.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 278, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 488.751, "r_y0": 690.942, "r_x1": 545.113, "r_y1": 690.942, "r_x2": 545.113, "r_y2": 683.245, "r_x3": 488.751, "r_y3": 683.245, "coord_origin": "TOPLEFT"}, "text": "Generalized in-", "orig": "Generalized in-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 279, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 701.901, "r_x1": 545.113, "r_y1": 701.901, "r_x2": 545.113, "r_y2": 694.204, "r_x3": 328.781, "r_y3": 694.204, "coord_origin": "TOPLEFT"}, "text": "tersection over union: A metric and a loss for bounding box", "orig": "tersection over union: A metric and a loss for bounding box", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 280, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 712.86, "r_x1": 367.74, "r_y1": 712.86, "r_x2": 367.74, "r_y2": 705.163, "r_x3": 328.781, "r_y3": 705.163, "coord_origin": "TOPLEFT"}, "text": "regression.", "orig": "regression.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 281, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 371.685, "r_y0": 712.86, "r_x1": 379.154, "r_y1": 712.86, "r_x2": 379.154, "r_y2": 705.163, "r_x3": 371.685, "r_y3": 705.163, "coord_origin": "TOPLEFT"}, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 282, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 381.616, "r_y0": 712.731, "r_x1": 545.109, "r_y1": 712.731, "r_x2": 545.109, "r_y2": 705.001, "r_x3": 381.616, "r_y3": 705.001, "coord_origin": "TOPLEFT"}, "text": "Proceedings of the IEEE/CVF Conference on", "orig": "Proceedings of the IEEE/CVF Conference on", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[25] Hamid Rezatofighi, Nathan Tsoi, JunYoung Gwak, Amir Sadeghian, Ian Reid, and Silvio Savarese. Generalized intersection over union: A metric and a loss for bounding box regression. In Proceedings of the IEEE/CVF Conference on"}, {"label": "page_footer", "id": 22, "page_no": 8, "cluster": {"id": 22, "label": "page_footer", "bbox": {"l": 295.121, "t": 734.402, "r": 300.102, "b": 742.954, "coord_origin": "TOPLEFT"}, "confidence": 0.8797808885574341, "cells": [{"index": 283, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 295.121, "r_y0": 742.954, "r_x1": 300.102, "r_y1": 742.954, "r_x2": 300.102, "r_y2": 734.402, "r_x3": 295.121, "r_y3": 734.402, "coord_origin": "TOPLEFT"}, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "9"}], "body": [{"label": "list_item", "id": 25, "page_no": 8, "cluster": {"id": 25, "label": "list_item", "bbox": {"l": 70.031, "t": 76.12599999999998, "r": 286.363, "b": 116.69899999999996, "coord_origin": "TOPLEFT"}, "confidence": 0.7310384511947632, "cells": [{"index": 0, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 83.82299999999998, "r_x1": 212.373, "r_y1": 83.82299999999998, "r_x2": 212.373, "r_y2": 76.12599999999998, "r_x3": 70.031, "r_y3": 76.12599999999998, "coord_origin": "TOPLEFT"}, "text": "end object detection with transformers.", "orig": "end object detection with transformers.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 217.313, "r_y0": 83.82299999999998, "r_x1": 286.363, "r_y1": 83.82299999999998, "r_x2": 286.363, "r_y2": 76.12599999999998, "r_x3": 217.313, "r_y3": 76.12599999999998, "coord_origin": "TOPLEFT"}, "text": "In Andrea Vedaldi,", "orig": "In Andrea Vedaldi,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 94.78200000000004, "r_x1": 286.363, "r_y1": 94.78200000000004, "r_x2": 286.363, "r_y2": 87.08500000000004, "r_x3": 70.031, "r_y3": 87.08500000000004, "coord_origin": "TOPLEFT"}, "text": "Horst Bischof, Thomas Brox, and Jan-Michael Frahm, edi-", "orig": "Horst Bischof, Thomas Brox, and Jan-Michael Frahm, edi-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 105.74000000000001, "r_x1": 85.722, "r_y1": 105.74000000000001, "r_x2": 85.722, "r_y2": 98.043, "r_x3": 70.031, "r_y3": 98.043, "coord_origin": "TOPLEFT"}, "text": "tors,", "orig": "tors,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 87.889, "r_y0": 105.61099999999999, "r_x1": 199.933, "r_y1": 105.61099999999999, "r_x2": 199.933, "r_y2": 97.88099999999997, "r_x3": 87.889, "r_y3": 97.88099999999997, "coord_origin": "TOPLEFT"}, "text": "Computer Vision - ECCV 2020", "orig": "Computer Vision - ECCV 2020", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 199.936, "r_y0": 105.74000000000001, "r_x1": 286.363, "r_y1": 105.74000000000001, "r_x2": 286.363, "r_y2": 98.043, "r_x3": 199.936, "r_y3": 98.043, "coord_origin": "TOPLEFT"}, "text": ", pages 213-229, Cham,", "orig": ", pages 213-229, Cham,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 116.69899999999996, "r_x1": 221.949, "r_y1": 116.69899999999996, "r_x2": 221.949, "r_y2": 109.00199999999995, "r_x3": 70.031, "r_y3": 109.00199999999995, "coord_origin": "TOPLEFT"}, "text": "2020. Springer International Publishing. 5", "orig": "2020. Springer International Publishing. 5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "end object detection with transformers. In Andrea Vedaldi, Horst Bischof, Thomas Brox, and Jan-Michael Frahm, editors, Computer Vision - ECCV 2020 , pages 213-229, Cham, 2020. Springer International Publishing. 5"}, {"label": "list_item", "id": 9, "page_no": 8, "cluster": {"id": 9, "label": "list_item", "bbox": {"l": 54.595, "t": 120.274, "r": 286.363, "b": 149.889, "coord_origin": "TOPLEFT"}, "confidence": 0.9372755885124207, "cells": [{"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 54.595, "r_y0": 127.971, "r_x1": 65.05, "r_y1": 127.971, "r_x2": 65.05, "r_y2": 120.274, "r_x3": 54.595, "r_y3": 120.274, "coord_origin": "TOPLEFT"}, "text": "[2]", "orig": "[2]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 127.971, "r_x1": 286.359, "r_y1": 127.971, "r_x2": 286.359, "r_y2": 120.274, "r_x3": 70.035, "r_y3": 120.274, "coord_origin": "TOPLEFT"}, "text": "Zewen Chi, Heyan Huang, Heng-Da Xu, Houjin Yu, Wanx-", "orig": "Zewen Chi, Heyan Huang, Heng-Da Xu, Houjin Yu, Wanx-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 138.92999999999995, "r_x1": 179.672, "r_y1": 138.92999999999995, "r_x2": 179.672, "r_y2": 131.23299999999995, "r_x3": 70.031, "r_y3": 131.23299999999995, "coord_origin": "TOPLEFT"}, "text": "uan Yin, and Xian-Ling Mao.", "orig": "uan Yin, and Xian-Ling Mao.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 185.581, "r_y0": 138.92999999999995, "r_x1": 286.363, "r_y1": 138.92999999999995, "r_x2": 286.363, "r_y2": 131.23299999999995, "r_x3": 185.581, "r_y3": 131.23299999999995, "coord_origin": "TOPLEFT"}, "text": "Complicated table structure", "orig": "Complicated table structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 149.889, "r_x1": 113.115, "r_y1": 149.889, "r_x2": 113.115, "r_y2": 142.192, "r_x3": 70.031, "r_y3": 142.192, "coord_origin": "TOPLEFT"}, "text": "recognition.", "orig": "recognition.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 116.342, "r_y0": 149.76, "r_x1": 235.308, "r_y1": 149.76, "r_x2": 235.308, "r_y2": 142.02999999999997, "r_x3": 116.342, "r_y3": 142.02999999999997, "coord_origin": "TOPLEFT"}, "text": "arXiv preprint arXiv:1908.04729", "orig": "arXiv preprint arXiv:1908.04729", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 235.307, "r_y0": 149.889, "r_x1": 267.676, "r_y1": 149.889, "r_x2": 267.676, "r_y2": 142.192, "r_x3": 235.307, "r_y3": 142.192, "coord_origin": "TOPLEFT"}, "text": ", 2019. 3", "orig": ", 2019. 3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[2] Zewen Chi, Heyan Huang, Heng-Da Xu, Houjin Yu, Wanxuan Yin, and Xian-Ling Mao. Complicated table structure recognition. arXiv preprint arXiv:1908.04729 , 2019. 3"}, {"label": "list_item", "id": 7, "page_no": 8, "cluster": {"id": 7, "label": "list_item", "bbox": {"l": 54.595, "t": 153.30200000000002, "r": 286.363, "b": 183.07799999999997, "coord_origin": "TOPLEFT"}, "confidence": 0.9378374218940735, "cells": [{"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 54.595, "r_y0": 161.16099999999994, "r_x1": 65.05, "r_y1": 161.16099999999994, "r_x2": 65.05, "r_y2": 153.46400000000006, "r_x3": 54.595, "r_y3": 153.46400000000006, "coord_origin": "TOPLEFT"}, "text": "[3]", "orig": "[3]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 161.16099999999994, "r_x1": 218.779, "r_y1": 161.16099999999994, "r_x2": 218.779, "r_y2": 153.46400000000006, "r_x3": 70.035, "r_y3": 153.46400000000006, "coord_origin": "TOPLEFT"}, "text": "Bertrand Couasnon and Aurelie Lemaitre.", "orig": "Bertrand Couasnon and Aurelie Lemaitre.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 220.98, "r_y0": 161.03200000000004, "r_x1": 286.363, "r_y1": 161.03200000000004, "r_x2": 286.363, "r_y2": 153.30200000000002, "r_x3": 220.98, "r_y3": 153.30200000000002, "coord_origin": "TOPLEFT"}, "text": "Recognition of Ta-", "orig": "Recognition of Ta-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 171.99099999999999, "r_x1": 125.264, "r_y1": 171.99099999999999, "r_x2": 125.264, "r_y2": 164.26099999999997, "r_x3": 70.031, "r_y3": 164.26099999999997, "coord_origin": "TOPLEFT"}, "text": "bles and Forms", "orig": "bles and Forms", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 125.261, "r_y0": 172.12, "r_x1": 127.503, "r_y1": 172.12, "r_x2": 127.503, "r_y2": 164.423, "r_x3": 125.261, "r_y3": 164.423, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 19, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 129.986, "r_y0": 172.12, "r_x1": 286.36, "r_y1": 172.12, "r_x2": 286.36, "r_y2": 164.423, "r_x3": 129.986, "r_y3": 164.423, "coord_origin": "TOPLEFT"}, "text": "pages 647-677. Springer London, London,", "orig": "pages 647-677. Springer London, London,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 20, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 183.07799999999997, "r_x1": 97.917, "r_y1": 183.07799999999997, "r_x2": 97.917, "r_y2": 175.38099999999997, "r_x3": 70.031, "r_y3": 175.38099999999997, "coord_origin": "TOPLEFT"}, "text": "2014. 2", "orig": "2014. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[3] Bertrand Couasnon and Aurelie Lemaitre. Recognition of Tables and Forms , pages 647-677. Springer London, London, 2014. 2"}, {"label": "list_item", "id": 0, "page_no": 8, "cluster": {"id": 0, "label": "list_item", "bbox": {"l": 54.595, "t": 186.65300000000002, "r": 286.364, "b": 227.22699999999998, "coord_origin": "TOPLEFT"}, "confidence": 0.9648825526237488, "cells": [{"index": 21, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 54.595, "r_y0": 194.35000000000002, "r_x1": 65.05, "r_y1": 194.35000000000002, "r_x2": 65.05, "r_y2": 186.65300000000002, "r_x3": 54.595, "r_y3": 186.65300000000002, "coord_origin": "TOPLEFT"}, "text": "[4]", "orig": "[4]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 22, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 194.35000000000002, "r_x1": 91.936, "r_y1": 194.35000000000002, "r_x2": 91.936, "r_y2": 186.65300000000002, "r_x3": 70.035, "r_y3": 186.65300000000002, "coord_origin": "TOPLEFT"}, "text": "Herv\u00b4 e", "orig": "Herv\u00b4 e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 23, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 97.101, "r_y0": 194.35000000000002, "r_x1": 124.736, "r_y1": 194.35000000000002, "r_x2": 124.736, "r_y2": 186.65300000000002, "r_x3": 97.101, "r_y3": 186.65300000000002, "coord_origin": "TOPLEFT"}, "text": "D\u00b4jean,", "orig": "D\u00b4jean,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 24, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 103.575, "r_y0": 194.35000000000002, "r_x1": 107.556, "r_y1": 194.35000000000002, "r_x2": 107.556, "r_y2": 186.65300000000002, "r_x3": 103.575, "r_y3": 186.65300000000002, "coord_origin": "TOPLEFT"}, "text": "e", "orig": "e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 25, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 130.636, "r_y0": 194.35000000000002, "r_x1": 163.497, "r_y1": 194.35000000000002, "r_x2": 163.497, "r_y2": 186.65300000000002, "r_x3": 130.636, "r_y3": 186.65300000000002, "coord_origin": "TOPLEFT"}, "text": "Jean-Luc", "orig": "Jean-Luc", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 26, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 168.662, "r_y0": 194.35000000000002, "r_x1": 200.923, "r_y1": 194.35000000000002, "r_x2": 200.923, "r_y2": 186.65300000000002, "r_x3": 168.662, "r_y3": 186.65300000000002, "coord_origin": "TOPLEFT"}, "text": "Meunier,", "orig": "Meunier,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 27, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 206.814, "r_y0": 194.35000000000002, "r_x1": 238.188, "r_y1": 194.35000000000002, "r_x2": 238.188, "r_y2": 186.65300000000002, "r_x3": 206.814, "r_y3": 186.65300000000002, "coord_origin": "TOPLEFT"}, "text": "Liangcai", "orig": "Liangcai", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 28, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 243.352, "r_y0": 194.35000000000002, "r_x1": 260.532, "r_y1": 194.35000000000002, "r_x2": 260.532, "r_y2": 186.65300000000002, "r_x3": 243.352, "r_y3": 186.65300000000002, "coord_origin": "TOPLEFT"}, "text": "Gao,", "orig": "Gao,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 29, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 266.432, "r_y0": 194.35000000000002, "r_x1": 286.364, "r_y1": 194.35000000000002, "r_x2": 286.364, "r_y2": 186.65300000000002, "r_x3": 266.432, "r_y3": 186.65300000000002, "coord_origin": "TOPLEFT"}, "text": "Yilun", "orig": "Yilun", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 30, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 205.30899999999997, "r_x1": 269.605, "r_y1": 205.30899999999997, "r_x2": 269.605, "r_y2": 197.61199999999997, "r_x3": 70.031, "r_y3": 197.61199999999997, "coord_origin": "TOPLEFT"}, "text": "Huang, Yu Fang, Florian Kleber, and Eva-Maria Lang.", "orig": "Huang, Yu Fang, Florian Kleber, and Eva-Maria Lang.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 274.411, "r_y0": 205.30899999999997, "r_x1": 286.363, "r_y1": 205.30899999999997, "r_x2": 286.363, "r_y2": 197.61199999999997, "r_x3": 274.411, "r_y3": 197.61199999999997, "coord_origin": "TOPLEFT"}, "text": "IC-", "orig": "IC-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 216.26800000000003, "r_x1": 286.363, "r_y1": 216.26800000000003, "r_x2": 286.363, "r_y2": 208.57100000000003, "r_x3": 70.031, "r_y3": 208.57100000000003, "coord_origin": "TOPLEFT"}, "text": "DAR 2019 Competition on Table Detection and Recognition", "orig": "DAR 2019 Competition on Table Detection and Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 227.22699999999998, "r_x1": 245.835, "r_y1": 227.22699999999998, "r_x2": 245.835, "r_y2": 219.52999999999997, "r_x3": 70.031, "r_y3": 219.52999999999997, "coord_origin": "TOPLEFT"}, "text": "(cTDaR), Apr. 2019. http://sac.founderit.com/. 2", "orig": "(cTDaR), Apr. 2019. http://sac.founderit.com/. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[4] Herv\u00b4 e D\u00b4jean, e Jean-Luc Meunier, Liangcai Gao, Yilun Huang, Yu Fang, Florian Kleber, and Eva-Maria Lang. ICDAR 2019 Competition on Table Detection and Recognition (cTDaR), Apr. 2019. http://sac.founderit.com/. 2"}, {"label": "list_item", "id": 1, "page_no": 8, "cluster": {"id": 1, "label": "list_item", "bbox": {"l": 54.595, "t": 230.80200000000002, "r": 286.363, "b": 271.375, "coord_origin": "TOPLEFT"}, "confidence": 0.9620943069458008, "cells": [{"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 54.595, "r_y0": 238.49900000000002, "r_x1": 65.05, "r_y1": 238.49900000000002, "r_x2": 65.05, "r_y2": 230.80200000000002, "r_x3": 54.595, "r_y3": 230.80200000000002, "coord_origin": "TOPLEFT"}, "text": "[5]", "orig": "[5]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 238.49900000000002, "r_x1": 286.359, "r_y1": 238.49900000000002, "r_x2": 286.359, "r_y2": 230.80200000000002, "r_x3": 70.035, "r_y3": 230.80200000000002, "coord_origin": "TOPLEFT"}, "text": "Basilios Gatos, Dimitrios Danatsas, Ioannis Pratikakis, and", "orig": "Basilios Gatos, Dimitrios Danatsas, Ioannis Pratikakis, and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 249.45799999999997, "r_x1": 286.363, "r_y1": 249.45799999999997, "r_x2": 286.363, "r_y2": 241.76099999999997, "r_x3": 70.031, "r_y3": 241.76099999999997, "coord_origin": "TOPLEFT"}, "text": "Stavros J Perantonis. Automatic table detection in document", "orig": "Stavros J Perantonis. Automatic table detection in document", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 260.41600000000005, "r_x1": 108.398, "r_y1": 260.41600000000005, "r_x2": 108.398, "r_y2": 252.71900000000005, "r_x3": 70.031, "r_y3": 252.71900000000005, "coord_origin": "TOPLEFT"}, "text": "images. In", "orig": "images. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 110.645, "r_y0": 260.28700000000003, "r_x1": 286.36, "r_y1": 260.28700000000003, "r_x2": 286.36, "r_y2": 252.55700000000002, "r_x3": 110.645, "r_y3": 252.55700000000002, "coord_origin": "TOPLEFT"}, "text": "International Conference on Pattern Recognition", "orig": "International Conference on Pattern Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 271.246, "r_x1": 140.579, "r_y1": 271.246, "r_x2": 140.579, "r_y2": 263.51599999999996, "r_x3": 70.031, "r_y3": 263.51599999999996, "coord_origin": "TOPLEFT"}, "text": "and Image Analysis", "orig": "and Image Analysis", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 140.578, "r_y0": 271.375, "r_x1": 266.475, "r_y1": 271.375, "r_x2": 266.475, "r_y2": 263.678, "r_x3": 140.578, "r_y3": 263.678, "coord_origin": "TOPLEFT"}, "text": ", pages 609-618. Springer, 2005. 2", "orig": ", pages 609-618. Springer, 2005. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[5] Basilios Gatos, Dimitrios Danatsas, Ioannis Pratikakis, and Stavros J Perantonis. Automatic table detection in document images. In International Conference on Pattern Recognition and Image Analysis , pages 609-618. Springer, 2005. 2"}, {"label": "list_item", "id": 2, "page_no": 8, "cluster": {"id": 2, "label": "list_item", "bbox": {"l": 54.595, "t": 274.95000000000005, "r": 286.367, "b": 315.524, "coord_origin": "TOPLEFT"}, "confidence": 0.9555517435073853, "cells": [{"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 54.595, "r_y0": 282.647, "r_x1": 65.05, "r_y1": 282.647, "r_x2": 65.05, "r_y2": 274.95000000000005, "r_x3": 54.595, "r_y3": 274.95000000000005, "coord_origin": "TOPLEFT"}, "text": "[6]", "orig": "[6]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 282.647, "r_x1": 286.367, "r_y1": 282.647, "r_x2": 286.367, "r_y2": 274.95000000000005, "r_x3": 70.035, "r_y3": 274.95000000000005, "coord_origin": "TOPLEFT"}, "text": "MaxG\u00a8bel, Tamir Hassan, Ermelinda Oro, and Giorgio Orsi.", "orig": "MaxG\u00a8bel, Tamir Hassan, Ermelinda Oro, and Giorgio Orsi.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 94.719, "r_y0": 282.647, "r_x1": 99.202, "r_y1": 282.647, "r_x2": 99.202, "r_y2": 274.95000000000005, "r_x3": 94.719, "r_y3": 274.95000000000005, "coord_origin": "TOPLEFT"}, "text": "o", "orig": "o", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 293.606, "r_x1": 179.574, "r_y1": 293.606, "r_x2": 179.574, "r_y2": 285.909, "r_x3": 70.031, "r_y3": 285.909, "coord_origin": "TOPLEFT"}, "text": "Icdar 2013 table competition.", "orig": "Icdar 2013 table competition.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 187.016, "r_y0": 293.606, "r_x1": 194.485, "r_y1": 293.606, "r_x2": 194.485, "r_y2": 285.909, "r_x3": 187.016, "r_y3": 285.909, "coord_origin": "TOPLEFT"}, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 198.044, "r_y0": 293.477, "r_x1": 286.363, "r_y1": 293.477, "r_x2": 286.363, "r_y2": 285.747, "r_x3": 198.044, "r_y3": 285.747, "coord_origin": "TOPLEFT"}, "text": "2013 12th International", "orig": "2013 12th International", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 304.436, "r_x1": 260.199, "r_y1": 304.436, "r_x2": 260.199, "r_y2": 296.706, "r_x3": 70.031, "r_y3": 296.706, "coord_origin": "TOPLEFT"}, "text": "Conference on Document Analysis and Recognition", "orig": "Conference on Document Analysis and Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 48, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 260.198, "r_y0": 304.565, "r_x1": 262.44, "r_y1": 304.565, "r_x2": 262.44, "r_y2": 296.868, "r_x3": 260.198, "r_y3": 296.868, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 49, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 265.945, "r_y0": 304.565, "r_x1": 286.362, "r_y1": 304.565, "r_x2": 286.362, "r_y2": 296.868, "r_x3": 265.945, "r_y3": 296.868, "coord_origin": "TOPLEFT"}, "text": "pages", "orig": "pages", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 50, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 315.524, "r_x1": 142.749, "r_y1": 315.524, "r_x2": 142.749, "r_y2": 307.827, "r_x3": 70.031, "r_y3": 307.827, "coord_origin": "TOPLEFT"}, "text": "1449-1453, 2013. 2", "orig": "1449-1453, 2013. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[6] MaxG\u00a8bel, Tamir Hassan, Ermelinda Oro, and Giorgio Orsi. o Icdar 2013 table competition. In 2013 12th International Conference on Document Analysis and Recognition , pages 1449-1453, 2013. 2"}, {"label": "list_item", "id": 4, "page_no": 8, "cluster": {"id": 4, "label": "list_item", "bbox": {"l": 54.595, "t": 319.099, "r": 286.363, "b": 348.713, "coord_origin": "TOPLEFT"}, "confidence": 0.9479843378067017, "cells": [{"index": 51, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 54.595, "r_y0": 326.796, "r_x1": 65.05, "r_y1": 326.796, "r_x2": 65.05, "r_y2": 319.099, "r_x3": 54.595, "r_y3": 319.099, "coord_origin": "TOPLEFT"}, "text": "[7]", "orig": "[7]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 52, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 326.796, "r_x1": 199.492, "r_y1": 326.796, "r_x2": 199.492, "r_y2": 319.099, "r_x3": 70.035, "r_y3": 319.099, "coord_origin": "TOPLEFT"}, "text": "EA Green and M Krishnamoorthy.", "orig": "EA Green and M Krishnamoorthy.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 53, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 206.988, "r_y0": 326.796, "r_x1": 286.359, "r_y1": 326.796, "r_x2": 286.359, "r_y2": 319.099, "r_x3": 206.988, "r_y3": 319.099, "coord_origin": "TOPLEFT"}, "text": "Recognition of tables", "orig": "Recognition of tables", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 54, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 337.754, "r_x1": 176.283, "r_y1": 337.754, "r_x2": 176.283, "r_y2": 330.057, "r_x3": 70.031, "r_y3": 330.057, "coord_origin": "TOPLEFT"}, "text": "using table grammars. procs.", "orig": "using table grammars. procs.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 55, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 182.604, "r_y0": 337.754, "r_x1": 190.073, "r_y1": 337.754, "r_x2": 190.073, "r_y2": 330.057, "r_x3": 182.604, "r_y3": 330.057, "coord_origin": "TOPLEFT"}, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 56, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 193.283, "r_y0": 337.625, "r_x1": 286.363, "r_y1": 337.625, "r_x2": 286.363, "r_y2": 329.895, "r_x3": 193.283, "r_y3": 329.895, "coord_origin": "TOPLEFT"}, "text": "Symposium on Document", "orig": "Symposium on Document", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 57, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 348.584, "r_x1": 206.347, "r_y1": 348.584, "r_x2": 206.347, "r_y2": 340.854, "r_x3": 70.031, "r_y3": 340.854, "coord_origin": "TOPLEFT"}, "text": "Analysis and Recognition (SDAIR'95)", "orig": "Analysis and Recognition (SDAIR'95)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 58, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 206.346, "r_y0": 348.713, "r_x1": 274.822, "r_y1": 348.713, "r_x2": 274.822, "r_y2": 341.016, "r_x3": 206.346, "r_y3": 341.016, "coord_origin": "TOPLEFT"}, "text": ", pages 261-277. 2", "orig": ", pages 261-277. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[7] EA Green and M Krishnamoorthy. Recognition of tables using table grammars. procs. In Symposium on Document Analysis and Recognition (SDAIR'95) , pages 261-277. 2"}, {"label": "list_item", "id": 3, "page_no": 8, "cluster": {"id": 3, "label": "list_item", "bbox": {"l": 54.595, "t": 352.288, "r": 286.363, "b": 403.821, "coord_origin": "TOPLEFT"}, "confidence": 0.9484425187110901, "cells": [{"index": 59, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 54.595, "r_y0": 359.985, "r_x1": 65.05, "r_y1": 359.985, "r_x2": 65.05, "r_y2": 352.288, "r_x3": 54.595, "r_y3": 352.288, "coord_origin": "TOPLEFT"}, "text": "[8]", "orig": "[8]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 60, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 359.985, "r_x1": 286.359, "r_y1": 359.985, "r_x2": 286.359, "r_y2": 352.288, "r_x3": 70.035, "r_y3": 352.288, "coord_origin": "TOPLEFT"}, "text": "Khurram Azeem Hashmi, Alain Pagani, Marcus Liwicki, Di-", "orig": "Khurram Azeem Hashmi, Alain Pagani, Marcus Liwicki, Di-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 61, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 370.944, "r_x1": 234.125, "r_y1": 370.944, "r_x2": 234.125, "r_y2": 363.247, "r_x3": 70.031, "r_y3": 363.247, "coord_origin": "TOPLEFT"}, "text": "dier Stricker, and Muhammad Zeshan Afzal.", "orig": "dier Stricker, and Muhammad Zeshan Afzal.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 62, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 240.052, "r_y0": 370.944, "r_x1": 286.363, "r_y1": 370.944, "r_x2": 286.363, "r_y2": 363.247, "r_x3": 240.052, "r_y3": 363.247, "coord_origin": "TOPLEFT"}, "text": "Castabdetec-", "orig": "Castabdetec-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 63, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 381.903, "r_x1": 85.973, "r_y1": 381.903, "r_x2": 85.973, "r_y2": 374.206, "r_x3": 70.031, "r_y3": 374.206, "coord_origin": "TOPLEFT"}, "text": "tors:", "orig": "tors:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 64, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 90.349, "r_y0": 381.903, "r_x1": 286.363, "r_y1": 381.903, "r_x2": 286.363, "r_y2": 374.206, "r_x3": 90.349, "r_y3": 374.206, "coord_origin": "TOPLEFT"}, "text": "Cascade network for table detection in document im-", "orig": "Cascade network for table detection in document im-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 65, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 392.862, "r_x1": 286.363, "r_y1": 392.862, "r_x2": 286.363, "r_y2": 385.165, "r_x3": 70.031, "r_y3": 385.165, "coord_origin": "TOPLEFT"}, "text": "ages with recursive feature pyramid and switchable atrous", "orig": "ages with recursive feature pyramid and switchable atrous", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 66, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 403.821, "r_x1": 114.576, "r_y1": 403.821, "r_x2": 114.576, "r_y2": 396.124, "r_x3": 70.031, "r_y3": 396.124, "coord_origin": "TOPLEFT"}, "text": "convolution.", "orig": "convolution.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 67, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 117.804, "r_y0": 403.692, "r_x1": 186.729, "r_y1": 403.692, "r_x2": 186.729, "r_y2": 395.962, "r_x3": 117.804, "r_y3": 395.962, "coord_origin": "TOPLEFT"}, "text": "Journal of Imaging", "orig": "Journal of Imaging", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 68, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 186.728, "r_y0": 403.821, "r_x1": 243.001, "r_y1": 403.821, "r_x2": 243.001, "r_y2": 396.124, "r_x3": 186.728, "r_y3": 396.124, "coord_origin": "TOPLEFT"}, "text": ", 7(10), 2021. 1", "orig": ", 7(10), 2021. 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[8] Khurram Azeem Hashmi, Alain Pagani, Marcus Liwicki, Didier Stricker, and Muhammad Zeshan Afzal. Castabdetectors: Cascade network for table detection in document images with recursive feature pyramid and switchable atrous convolution. Journal of Imaging , 7(10), 2021. 1"}, {"label": "list_item", "id": 10, "page_no": 8, "cluster": {"id": 10, "label": "list_item", "bbox": {"l": 54.595, "t": 407.395, "r": 286.36, "b": 437.01, "coord_origin": "TOPLEFT"}, "confidence": 0.9330756664276123, "cells": [{"index": 69, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 54.595, "r_y0": 415.092, "r_x1": 65.05, "r_y1": 415.092, "r_x2": 65.05, "r_y2": 407.395, "r_x3": 54.595, "r_y3": 407.395, "coord_origin": "TOPLEFT"}, "text": "[9]", "orig": "[9]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 70, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 415.092, "r_x1": 286.359, "r_y1": 415.092, "r_x2": 286.359, "r_y2": 407.395, "r_x3": 70.035, "r_y3": 407.395, "coord_origin": "TOPLEFT"}, "text": "Kaiming He, Georgia Gkioxari, Piotr Dollar, and Ross Gir-", "orig": "Kaiming He, Georgia Gkioxari, Piotr Dollar, and Ross Gir-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 71, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 426.051, "r_x1": 147.133, "r_y1": 426.051, "r_x2": 147.133, "r_y2": 418.354, "r_x3": 70.031, "r_y3": 418.354, "coord_origin": "TOPLEFT"}, "text": "shick. Mask r-cnn. In", "orig": "shick. Mask r-cnn. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 72, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 149.156, "r_y0": 425.922, "r_x1": 286.36, "r_y1": 425.922, "r_x2": 286.36, "r_y2": 418.192, "r_x3": 149.156, "r_y3": 418.192, "coord_origin": "TOPLEFT"}, "text": "Proceedings of the IEEE International", "orig": "Proceedings of the IEEE International", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 73, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 436.881, "r_x1": 213.484, "r_y1": 436.881, "r_x2": 213.484, "r_y2": 429.151, "r_x3": 70.031, "r_y3": 429.151, "coord_origin": "TOPLEFT"}, "text": "Conference on Computer Vision (ICCV)", "orig": "Conference on Computer Vision (ICCV)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 74, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 213.483, "r_y0": 437.01, "r_x1": 261.041, "r_y1": 437.01, "r_x2": 261.041, "r_y2": 429.313, "r_x3": 213.483, "r_y3": 429.313, "coord_origin": "TOPLEFT"}, "text": ", Oct 2017. 1", "orig": ", Oct 2017. 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[9] Kaiming He, Georgia Gkioxari, Piotr Dollar, and Ross Girshick. Mask r-cnn. In Proceedings of the IEEE International Conference on Computer Vision (ICCV) , Oct 2017. 1"}, {"label": "list_item", "id": 14, "page_no": 8, "cluster": {"id": 14, "label": "list_item", "bbox": {"l": 50.112, "t": 440.585, "r": 286.363, "b": 481.159, "coord_origin": "TOPLEFT"}, "confidence": 0.9274735450744629, "cells": [{"index": 75, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 448.282, "r_x1": 65.05, "r_y1": 448.282, "r_x2": 65.05, "r_y2": 440.585, "r_x3": 50.112, "r_y3": 440.585, "coord_origin": "TOPLEFT"}, "text": "[10]", "orig": "[10]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 76, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 448.282, "r_x1": 286.359, "r_y1": 448.282, "r_x2": 286.359, "r_y2": 440.585, "r_x3": 70.035, "r_y3": 440.585, "coord_origin": "TOPLEFT"}, "text": "Yelin He, X. Qi, Jiaquan Ye, Peng Gao, Yihao Chen, Bing-", "orig": "Yelin He, X. Qi, Jiaquan Ye, Peng Gao, Yihao Chen, Bing-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 77, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 459.241, "r_x1": 202.743, "r_y1": 459.241, "r_x2": 202.743, "r_y2": 451.544, "r_x3": 70.031, "r_y3": 451.544, "coord_origin": "TOPLEFT"}, "text": "cong Li, Xin Tang, and Rong Xiao.", "orig": "cong Li, Xin Tang, and Rong Xiao.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 78, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 209.001, "r_y0": 459.241, "r_x1": 286.363, "r_y1": 459.241, "r_x2": 286.363, "r_y2": 451.544, "r_x3": 209.001, "r_y3": 451.544, "coord_origin": "TOPLEFT"}, "text": "Pingan-vcgroup's so-", "orig": "Pingan-vcgroup's so-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 79, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 470.2, "r_x1": 286.363, "r_y1": 470.2, "r_x2": 286.363, "r_y2": 462.503, "r_x3": 70.031, "r_y3": 462.503, "coord_origin": "TOPLEFT"}, "text": "lution for icdar 2021 competition on scientific table image", "orig": "lution for icdar 2021 competition on scientific table image", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 80, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 481.159, "r_x1": 141.87, "r_y1": 481.159, "r_x2": 141.87, "r_y2": 473.462, "r_x3": 70.031, "r_y3": 473.462, "coord_origin": "TOPLEFT"}, "text": "recognition to latex.", "orig": "recognition to latex.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 81, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 145.097, "r_y0": 481.03, "r_x1": 166.016, "r_y1": 481.03, "r_x2": 166.016, "r_y2": 473.3, "r_x3": 145.097, "r_y3": 473.3, "coord_origin": "TOPLEFT"}, "text": "ArXiv", "orig": "ArXiv", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 82, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 166.015, "r_y0": 481.159, "r_x1": 259.902, "r_y1": 481.159, "r_x2": 259.902, "r_y2": 473.462, "r_x3": 166.015, "r_y3": 473.462, "coord_origin": "TOPLEFT"}, "text": ", abs/2105.01846, 2021. 2", "orig": ", abs/2105.01846, 2021. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[10] Yelin He, X. Qi, Jiaquan Ye, Peng Gao, Yihao Chen, Bingcong Li, Xin Tang, and Rong Xiao. Pingan-vcgroup's solution for icdar 2021 competition on scientific table image recognition to latex. ArXiv , abs/2105.01846, 2021. 2"}, {"label": "list_item", "id": 11, "page_no": 8, "cluster": {"id": 11, "label": "list_item", "bbox": {"l": 50.112, "t": 484.733, "r": 286.363, "b": 536.266, "coord_origin": "TOPLEFT"}, "confidence": 0.9299950003623962, "cells": [{"index": 83, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 492.43, "r_x1": 65.05, "r_y1": 492.43, "r_x2": 65.05, "r_y2": 484.733, "r_x3": 50.112, "r_y3": 484.733, "coord_origin": "TOPLEFT"}, "text": "[11]", "orig": "[11]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 84, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 492.43, "r_x1": 117.091, "r_y1": 492.43, "r_x2": 117.091, "r_y2": 484.733, "r_x3": 70.035, "r_y3": 484.733, "coord_origin": "TOPLEFT"}, "text": "Jianying Hu,", "orig": "Jianying Hu,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 85, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 121.054, "r_y0": 492.43, "r_x1": 286.359, "r_y1": 492.43, "r_x2": 286.359, "r_y2": 484.733, "r_x3": 121.054, "r_y3": 484.733, "coord_origin": "TOPLEFT"}, "text": "Ramanujan S Kashi, Daniel P Lopresti, and", "orig": "Ramanujan S Kashi, Daniel P Lopresti, and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 86, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 503.389, "r_x1": 132.15, "r_y1": 503.389, "r_x2": 132.15, "r_y2": 495.692, "r_x3": 70.031, "r_y3": 495.692, "coord_origin": "TOPLEFT"}, "text": "Gordon Wilfong.", "orig": "Gordon Wilfong.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 87, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 137.691, "r_y0": 503.389, "r_x1": 273.362, "r_y1": 503.389, "r_x2": 273.362, "r_y2": 495.692, "r_x3": 137.691, "r_y3": 495.692, "coord_origin": "TOPLEFT"}, "text": "Medium-independent table detection.", "orig": "Medium-independent table detection.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 88, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 278.894, "r_y0": 503.389, "r_x1": 286.363, "r_y1": 503.389, "r_x2": 286.363, "r_y2": 495.692, "r_x3": 278.894, "r_y3": 495.692, "coord_origin": "TOPLEFT"}, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 89, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 514.219, "r_x1": 106.883, "r_y1": 514.219, "r_x2": 106.883, "r_y2": 506.489, "r_x3": 70.031, "r_y3": 506.489, "coord_origin": "TOPLEFT"}, "text": "Document", "orig": "Document", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 90, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 111.796, "r_y0": 514.219, "r_x1": 155.041, "r_y1": 514.219, "r_x2": 155.041, "r_y2": 506.489, "r_x3": 111.796, "r_y3": 506.489, "coord_origin": "TOPLEFT"}, "text": "Recognition", "orig": "Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 91, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 159.946, "r_y0": 514.219, "r_x1": 173.396, "r_y1": 514.219, "r_x2": 173.396, "r_y2": 506.489, "r_x3": 159.946, "r_y3": 506.489, "coord_origin": "TOPLEFT"}, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 92, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 178.309, "r_y0": 514.219, "r_x1": 211.046, "r_y1": 514.219, "r_x2": 211.046, "r_y2": 506.489, "r_x3": 178.309, "r_y3": 506.489, "coord_origin": "TOPLEFT"}, "text": "Retrieval", "orig": "Retrieval", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 93, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 215.959, "r_y0": 514.219, "r_x1": 227.409, "r_y1": 514.219, "r_x2": 227.409, "r_y2": 506.489, "r_x3": 215.959, "r_y3": 506.489, "coord_origin": "TOPLEFT"}, "text": "VII", "orig": "VII", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 94, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 227.405, "r_y0": 514.348, "r_x1": 229.647, "r_y1": 514.348, "r_x2": 229.647, "r_y2": 506.651, "r_x3": 227.405, "r_y3": 506.651, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 95, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 234.56, "r_y0": 514.348, "r_x1": 261.28, "r_y1": 514.348, "r_x2": 261.28, "r_y2": 506.651, "r_x3": 234.56, "r_y3": 506.651, "coord_origin": "TOPLEFT"}, "text": "volume", "orig": "volume", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 96, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 266.185, "r_y0": 514.348, "r_x1": 286.359, "r_y1": 514.348, "r_x2": 286.359, "r_y2": 506.651, "r_x3": 266.185, "r_y3": 506.651, "coord_origin": "TOPLEFT"}, "text": "3967,", "orig": "3967,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 97, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 525.307, "r_x1": 286.363, "r_y1": 525.307, "r_x2": 286.363, "r_y2": 517.61, "r_x3": 70.031, "r_y3": 517.61, "coord_origin": "TOPLEFT"}, "text": "pages 291-302. International Society for Optics and Photon-", "orig": "pages 291-302. International Society for Optics and Photon-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 98, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 536.266, "r_x1": 112.361, "r_y1": 536.266, "r_x2": 112.361, "r_y2": 528.569, "r_x3": 70.031, "r_y3": 528.569, "coord_origin": "TOPLEFT"}, "text": "ics, 1999. 2", "orig": "ics, 1999. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[11] Jianying Hu, Ramanujan S Kashi, Daniel P Lopresti, and Gordon Wilfong. Medium-independent table detection. In Document Recognition and Retrieval VII , volume 3967, pages 291-302. International Society for Optics and Photonics, 1999. 2"}, {"label": "list_item", "id": 5, "page_no": 8, "cluster": {"id": 5, "label": "list_item", "bbox": {"l": 50.112, "t": 539.841, "r": 286.363, "b": 591.373, "coord_origin": "TOPLEFT"}, "confidence": 0.9394103288650513, "cells": [{"index": 99, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 547.538, "r_x1": 65.05, "r_y1": 547.538, "r_x2": 65.05, "r_y2": 539.841, "r_x3": 50.112, "r_y3": 539.841, "coord_origin": "TOPLEFT"}, "text": "[12]", "orig": "[12]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 100, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 547.538, "r_x1": 126.407, "r_y1": 547.538, "r_x2": 126.407, "r_y2": 539.841, "r_x3": 70.035, "r_y3": 539.841, "coord_origin": "TOPLEFT"}, "text": "Matthew Hurst.", "orig": "Matthew Hurst.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 101, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 130.648, "r_y0": 547.538, "r_x1": 286.359, "r_y1": 547.538, "r_x2": 286.359, "r_y2": 539.841, "r_x3": 130.648, "r_y3": 539.841, "coord_origin": "TOPLEFT"}, "text": "A constraint-based approach to table struc-", "orig": "A constraint-based approach to table struc-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 102, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 558.4970000000001, "r_x1": 124.654, "r_y1": 558.4970000000001, "r_x2": 124.654, "r_y2": 550.8, "r_x3": 70.031, "r_y3": 550.8, "coord_origin": "TOPLEFT"}, "text": "ture derivation.", "orig": "ture derivation.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 103, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 128.815, "r_y0": 558.4970000000001, "r_x1": 136.284, "r_y1": 558.4970000000001, "r_x2": 136.284, "r_y2": 550.8, "r_x3": 128.815, "r_y3": 550.8, "coord_origin": "TOPLEFT"}, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 104, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 138.811, "r_y0": 558.3679999999999, "r_x1": 286.362, "r_y1": 558.3679999999999, "r_x2": 286.362, "r_y2": 550.638, "r_x3": 138.811, "r_y3": 550.638, "coord_origin": "TOPLEFT"}, "text": "Proceedings of the Seventh International", "orig": "Proceedings of the Seventh International", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 105, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 569.327, "r_x1": 286.363, "r_y1": 569.327, "r_x2": 286.363, "r_y2": 561.597, "r_x3": 70.031, "r_y3": 561.597, "coord_origin": "TOPLEFT"}, "text": "Conference on Document Analysis and Recognition - Volume", "orig": "Conference on Document Analysis and Recognition - Volume", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 106, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 580.2860000000001, "r_x1": 74.514, "r_y1": 580.2860000000001, "r_x2": 74.514, "r_y2": 572.556, "r_x3": 70.031, "r_y3": 572.556, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 107, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 74.514, "r_y0": 580.415, "r_x1": 76.756, "r_y1": 580.415, "r_x2": 76.756, "r_y2": 572.718, "r_x3": 74.514, "r_y3": 572.718, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 108, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 79.06, "r_y0": 580.415, "r_x1": 286.363, "r_y1": 580.415, "r_x2": 286.363, "r_y2": 572.718, "r_x3": 79.06, "r_y3": 572.718, "coord_origin": "TOPLEFT"}, "text": "ICDAR '03, page 911, USA, 2003. IEEE Computer Soci-", "orig": "ICDAR '03, page 911, USA, 2003. IEEE Computer Soci-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 109, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 591.373, "r_x1": 82.647, "r_y1": 591.373, "r_x2": 82.647, "r_y2": 583.6759999999999, "r_x3": 70.031, "r_y3": 583.6759999999999, "coord_origin": "TOPLEFT"}, "text": "ety.", "orig": "ety.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 110, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 85.875, "r_y0": 591.373, "r_x1": 90.358, "r_y1": 591.373, "r_x2": 90.358, "r_y2": 583.6759999999999, "r_x3": 85.875, "r_y3": 583.6759999999999, "coord_origin": "TOPLEFT"}, "text": "2", "orig": "2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[12] Matthew Hurst. A constraint-based approach to table structure derivation. In Proceedings of the Seventh International Conference on Document Analysis and Recognition - Volume 2 , ICDAR '03, page 911, USA, 2003. IEEE Computer Society. 2"}, {"label": "list_item", "id": 13, "page_no": 8, "cluster": {"id": 13, "label": "list_item", "bbox": {"l": 50.112, "t": 594.948, "r": 286.363, "b": 646.481, "coord_origin": "TOPLEFT"}, "confidence": 0.9298838973045349, "cells": [{"index": 111, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 602.645, "r_x1": 65.05, "r_y1": 602.645, "r_x2": 65.05, "r_y2": 594.948, "r_x3": 50.112, "r_y3": 594.948, "coord_origin": "TOPLEFT"}, "text": "[13]", "orig": "[13]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 112, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 602.645, "r_x1": 116.302, "r_y1": 602.645, "r_x2": 116.302, "r_y2": 594.948, "r_x3": 70.035, "r_y3": 594.948, "coord_origin": "TOPLEFT"}, "text": "Thotreingam", "orig": "Thotreingam", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 113, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 121.368, "r_y0": 602.645, "r_x1": 144.161, "r_y1": 602.645, "r_x2": 144.161, "r_y2": 594.948, "r_x3": 121.368, "r_y3": 594.948, "coord_origin": "TOPLEFT"}, "text": "Kasar,", "orig": "Kasar,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 114, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 149.926, "r_y0": 602.645, "r_x1": 186.796, "r_y1": 602.645, "r_x2": 186.796, "r_y2": 594.948, "r_x3": 149.926, "r_y3": 594.948, "coord_origin": "TOPLEFT"}, "text": "Philippine", "orig": "Philippine", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 115, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 191.862, "r_y0": 602.645, "r_x1": 217.013, "r_y1": 602.645, "r_x2": 217.013, "r_y2": 594.948, "r_x3": 191.862, "r_y3": 594.948, "coord_origin": "TOPLEFT"}, "text": "Barlas,", "orig": "Barlas,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 116, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 222.778, "r_y0": 602.645, "r_x1": 257.146, "r_y1": 602.645, "r_x2": 257.146, "r_y2": 594.948, "r_x3": 222.778, "r_y3": 594.948, "coord_origin": "TOPLEFT"}, "text": "Sebastien", "orig": "Sebastien", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 117, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 262.203, "r_y0": 602.645, "r_x1": 286.359, "r_y1": 602.645, "r_x2": 286.359, "r_y2": 594.948, "r_x3": 262.203, "r_y3": 594.948, "coord_origin": "TOPLEFT"}, "text": "Adam,", "orig": "Adam,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 118, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 613.604, "r_x1": 214.838, "r_y1": 613.604, "r_x2": 214.838, "r_y2": 605.907, "r_x3": 70.031, "r_y3": 605.907, "coord_origin": "TOPLEFT"}, "text": "Cl\u00b4ment Chatelain, and Thierry Paquet.", "orig": "Cl\u00b4ment Chatelain, and Thierry Paquet.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 119, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 78.504, "r_y0": 613.604, "r_x1": 82.485, "r_y1": 613.604, "r_x2": 82.485, "r_y2": 605.907, "r_x3": 78.504, "r_y3": 605.907, "coord_origin": "TOPLEFT"}, "text": "e", "orig": "e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 120, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 219.949, "r_y0": 613.604, "r_x1": 286.363, "r_y1": 613.604, "r_x2": 286.363, "r_y2": 605.907, "r_x3": 219.949, "r_y3": 605.907, "coord_origin": "TOPLEFT"}, "text": "Learning to detect", "orig": "Learning to detect", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 121, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 624.563, "r_x1": 286.363, "r_y1": 624.563, "r_x2": 286.363, "r_y2": 616.866, "r_x3": 70.031, "r_y3": 616.866, "coord_origin": "TOPLEFT"}, "text": "tables in scanned document images using line information.", "orig": "tables in scanned document images using line information.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 122, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 635.5219999999999, "r_x1": 77.5, "r_y1": 635.5219999999999, "r_x2": 77.5, "r_y2": 627.825, "r_x3": 70.031, "r_y3": 627.825, "coord_origin": "TOPLEFT"}, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 123, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 79.92, "r_y0": 635.393, "r_x1": 286.362, "r_y1": 635.393, "r_x2": 286.362, "r_y2": 627.663, "r_x3": 79.92, "r_y3": 627.663, "coord_origin": "TOPLEFT"}, "text": "2013 12th International Conference on Document Analy-", "orig": "2013 12th International Conference on Document Analy-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 124, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 646.352, "r_x1": 140.677, "r_y1": 646.352, "r_x2": 140.677, "r_y2": 638.6220000000001, "r_x3": 70.031, "r_y3": 638.6220000000001, "coord_origin": "TOPLEFT"}, "text": "sis and Recognition", "orig": "sis and Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 125, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 140.676, "r_y0": 646.481, "r_x1": 264.439, "r_y1": 646.481, "r_x2": 264.439, "r_y2": 638.784, "r_x3": 140.676, "r_y3": 638.784, "coord_origin": "TOPLEFT"}, "text": ", pages 1185-1189. IEEE, 2013. 2", "orig": ", pages 1185-1189. IEEE, 2013. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[13] Thotreingam Kasar, Philippine Barlas, Sebastien Adam, Cl\u00b4ment Chatelain, and Thierry Paquet. e Learning to detect tables in scanned document images using line information. In 2013 12th International Conference on Document Analysis and Recognition , pages 1185-1189. IEEE, 2013. 2"}, {"label": "list_item", "id": 17, "page_no": 8, "cluster": {"id": 17, "label": "list_item", "bbox": {"l": 50.112, "t": 650.056, "r": 286.363, "b": 679.67, "coord_origin": "TOPLEFT"}, "confidence": 0.9115257263183594, "cells": [{"index": 126, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 657.7529999999999, "r_x1": 65.05, "r_y1": 657.7529999999999, "r_x2": 65.05, "r_y2": 650.056, "r_x3": 50.112, "r_y3": 650.056, "coord_origin": "TOPLEFT"}, "text": "[14]", "orig": "[14]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 127, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 657.7529999999999, "r_x1": 91.447, "r_y1": 657.7529999999999, "r_x2": 91.447, "r_y2": 650.056, "r_x3": 70.035, "r_y3": 650.056, "coord_origin": "TOPLEFT"}, "text": "Pratik", "orig": "Pratik", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 128, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 96.092, "r_y0": 657.7529999999999, "r_x1": 119.745, "r_y1": 657.7529999999999, "r_x2": 119.745, "r_y2": 650.056, "r_x3": 96.092, "r_y3": 650.056, "coord_origin": "TOPLEFT"}, "text": "Kayal,", "orig": "Kayal,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 129, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 124.99, "r_y0": 657.7529999999999, "r_x1": 149.397, "r_y1": 657.7529999999999, "r_x2": 149.397, "r_y2": 650.056, "r_x3": 124.99, "r_y3": 650.056, "coord_origin": "TOPLEFT"}, "text": "Mrinal", "orig": "Mrinal", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 130, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 154.042, "r_y0": 657.7529999999999, "r_x1": 180.188, "r_y1": 657.7529999999999, "r_x2": 180.188, "r_y2": 650.056, "r_x3": 154.042, "r_y3": 650.056, "coord_origin": "TOPLEFT"}, "text": "Anand,", "orig": "Anand,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 131, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 185.433, "r_y0": 657.7529999999999, "r_x1": 206.845, "r_y1": 657.7529999999999, "r_x2": 206.845, "r_y2": 650.056, "r_x3": 185.433, "r_y3": 650.056, "coord_origin": "TOPLEFT"}, "text": "Harsh", "orig": "Harsh", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 132, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 211.489, "r_y0": 657.7529999999999, "r_x1": 234.147, "r_y1": 657.7529999999999, "r_x2": 234.147, "r_y2": 650.056, "r_x3": 211.489, "r_y3": 650.056, "coord_origin": "TOPLEFT"}, "text": "Desai,", "orig": "Desai,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 133, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 239.393, "r_y0": 657.7529999999999, "r_x1": 252.34, "r_y1": 657.7529999999999, "r_x2": 252.34, "r_y2": 650.056, "r_x3": 239.393, "r_y3": 650.056, "coord_origin": "TOPLEFT"}, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 134, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 256.976, "r_y0": 657.7529999999999, "r_x1": 286.359, "r_y1": 657.7529999999999, "r_x2": 286.359, "r_y2": 650.056, "r_x3": 256.976, "r_y3": 650.056, "coord_origin": "TOPLEFT"}, "text": "Mayank", "orig": "Mayank", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 135, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 668.711, "r_x1": 93.2, "r_y1": 668.711, "r_x2": 93.2, "r_y2": 661.014, "r_x3": 70.031, "r_y3": 661.014, "coord_origin": "TOPLEFT"}, "text": "Singh.", "orig": "Singh.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 136, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 102.202, "r_y0": 668.711, "r_x1": 120.619, "r_y1": 668.711, "r_x2": 120.619, "r_y2": 661.014, "r_x3": 102.202, "r_y3": 661.014, "coord_origin": "TOPLEFT"}, "text": "Icdar", "orig": "Icdar", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 137, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 124.672, "r_y0": 668.711, "r_x1": 238.922, "r_y1": 668.711, "r_x2": 238.922, "r_y2": 661.014, "r_x3": 124.672, "r_y3": 661.014, "coord_origin": "TOPLEFT"}, "text": "2021 competition on scientific", "orig": "2021 competition on scientific", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 138, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 242.975, "r_y0": 668.711, "r_x1": 260.406, "r_y1": 668.711, "r_x2": 260.406, "r_y2": 661.014, "r_x3": 242.975, "r_y3": 661.014, "coord_origin": "TOPLEFT"}, "text": "table", "orig": "table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 139, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 264.449, "r_y0": 668.711, "r_x1": 286.363, "r_y1": 668.711, "r_x2": 286.363, "r_y2": 661.014, "r_x3": 264.449, "r_y3": 661.014, "coord_origin": "TOPLEFT"}, "text": "image", "orig": "image", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 140, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 679.67, "r_x1": 171.997, "r_y1": 679.67, "r_x2": 171.997, "r_y2": 671.973, "r_x3": 70.031, "r_y3": 671.973, "coord_origin": "TOPLEFT"}, "text": "recognition to latex, 2021. 2", "orig": "recognition to latex, 2021. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[14] Pratik Kayal, Mrinal Anand, Harsh Desai, and Mayank Singh. Icdar 2021 competition on scientific table image recognition to latex, 2021. 2"}, {"label": "list_item", "id": 16, "page_no": 8, "cluster": {"id": 16, "label": "list_item", "bbox": {"l": 50.112, "t": 683.245, "r": 286.359, "b": 712.86, "coord_origin": "TOPLEFT"}, "confidence": 0.912230372428894, "cells": [{"index": 141, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 690.942, "r_x1": 65.05, "r_y1": 690.942, "r_x2": 65.05, "r_y2": 683.245, "r_x3": 50.112, "r_y3": 683.245, "coord_origin": "TOPLEFT"}, "text": "[15]", "orig": "[15]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 142, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 690.942, "r_x1": 286.359, "r_y1": 690.942, "r_x2": 286.359, "r_y2": 683.245, "r_x3": 70.035, "r_y3": 683.245, "coord_origin": "TOPLEFT"}, "text": "Harold WKuhn. The hungarian method for the assignment", "orig": "Harold WKuhn. The hungarian method for the assignment", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 143, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 701.901, "r_x1": 102.158, "r_y1": 701.901, "r_x2": 102.158, "r_y2": 694.204, "r_x3": 70.031, "r_y3": 694.204, "coord_origin": "TOPLEFT"}, "text": "problem.", "orig": "problem.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 144, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 107.55, "r_y0": 701.772, "r_x1": 231.475, "r_y1": 701.772, "r_x2": 231.475, "r_y2": 694.042, "r_x3": 107.55, "r_y3": 694.042, "coord_origin": "TOPLEFT"}, "text": "Naval research logistics quarterly", "orig": "Naval research logistics quarterly", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 145, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 231.476, "r_y0": 701.901, "r_x1": 233.718, "r_y1": 701.901, "r_x2": 233.718, "r_y2": 694.204, "r_x3": 231.476, "r_y3": 694.204, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 146, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 236.802, "r_y0": 701.901, "r_x1": 286.359, "r_y1": 701.901, "r_x2": 286.359, "r_y2": 694.204, "r_x3": 236.802, "r_y3": 694.204, "coord_origin": "TOPLEFT"}, "text": "2(1-2):83-97,", "orig": "2(1-2):83-97,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 147, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 712.86, "r_x1": 97.917, "r_y1": 712.86, "r_x2": 97.917, "r_y2": 705.163, "r_x3": 70.031, "r_y3": 705.163, "coord_origin": "TOPLEFT"}, "text": "1955. 6", "orig": "1955. 6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[15] Harold WKuhn. The hungarian method for the assignment problem. Naval research logistics quarterly , 2(1-2):83-97, 1955. 6"}, {"label": "list_item", "id": 6, "page_no": 8, "cluster": {"id": 6, "label": "list_item", "bbox": {"l": 308.862, "t": 76.12599999999998, "r": 545.115, "b": 138.61699999999996, "coord_origin": "TOPLEFT"}, "confidence": 0.9389600157737732, "cells": [{"index": 148, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 83.82299999999998, "r_x1": 323.8, "r_y1": 83.82299999999998, "r_x2": 323.8, "r_y2": 76.12599999999998, "r_x3": 308.862, "r_y3": 76.12599999999998, "coord_origin": "TOPLEFT"}, "text": "[16]", "orig": "[16]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 149, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.785, "r_y0": 83.82299999999998, "r_x1": 351.192, "r_y1": 83.82299999999998, "r_x2": 351.192, "r_y2": 76.12599999999998, "r_x3": 328.785, "r_y3": 76.12599999999998, "coord_origin": "TOPLEFT"}, "text": "Girish", "orig": "Girish", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 150, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 355.308, "r_y0": 83.82299999999998, "r_x1": 389.291, "r_y1": 83.82299999999998, "r_x2": 389.291, "r_y2": 76.12599999999998, "r_x3": 355.308, "r_y3": 76.12599999999998, "coord_origin": "TOPLEFT"}, "text": "Kulkarni,", "orig": "Kulkarni,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 151, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 393.863, "r_y0": 83.82299999999998, "r_x1": 420.225, "r_y1": 83.82299999999998, "r_x2": 420.225, "r_y2": 76.12599999999998, "r_x3": 393.863, "r_y3": 76.12599999999998, "coord_origin": "TOPLEFT"}, "text": "Visruth", "orig": "Visruth", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 152, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 424.331, "r_y0": 83.82299999999998, "r_x1": 454.961, "r_y1": 83.82299999999998, "r_x2": 454.961, "r_y2": 76.12599999999998, "r_x3": 424.331, "r_y3": 76.12599999999998, "coord_origin": "TOPLEFT"}, "text": "Premraj,", "orig": "Premraj,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 153, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 459.533, "r_y0": 83.82299999999998, "r_x1": 486.881, "r_y1": 83.82299999999998, "r_x2": 486.881, "r_y2": 76.12599999999998, "r_x3": 459.533, "r_y3": 76.12599999999998, "coord_origin": "TOPLEFT"}, "text": "Vicente", "orig": "Vicente", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 154, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 490.988, "r_y0": 83.82299999999998, "r_x1": 524.1, "r_y1": 83.82299999999998, "r_x2": 524.1, "r_y2": 76.12599999999998, "r_x3": 490.988, "r_y3": 76.12599999999998, "coord_origin": "TOPLEFT"}, "text": "Ordonez,", "orig": "Ordonez,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 155, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 528.673, "r_y0": 83.82299999999998, "r_x1": 545.109, "r_y1": 83.82299999999998, "r_x2": 545.109, "r_y2": 76.12599999999998, "r_x3": 528.673, "r_y3": 76.12599999999998, "coord_origin": "TOPLEFT"}, "text": "Sag-", "orig": "Sag-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 156, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 94.78099999999995, "r_x1": 545.113, "r_y1": 94.78099999999995, "r_x2": 545.113, "r_y2": 87.08399999999995, "r_x3": 328.781, "r_y3": 87.08399999999995, "coord_origin": "TOPLEFT"}, "text": "nik Dhar, Siming Li, Yejin Choi, Alexander C. Berg, and", "orig": "nik Dhar, Siming Li, Yejin Choi, Alexander C. Berg, and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 157, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 105.74000000000001, "r_x1": 390.963, "r_y1": 105.74000000000001, "r_x2": 390.963, "r_y2": 98.043, "r_x3": 328.781, "r_y3": 98.043, "coord_origin": "TOPLEFT"}, "text": "Tamara L. Berg.", "orig": "Tamara L. Berg.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 158, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 400.27, "r_y0": 105.74000000000001, "r_x1": 435.14, "r_y1": 105.74000000000001, "r_x2": 435.14, "r_y2": 98.043, "r_x3": 400.27, "r_y3": 98.043, "coord_origin": "TOPLEFT"}, "text": "Babytalk:", "orig": "Babytalk:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 159, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 441.713, "r_y0": 105.74000000000001, "r_x1": 494.507, "r_y1": 105.74000000000001, "r_x2": 494.507, "r_y2": 98.043, "r_x3": 441.713, "r_y3": 98.043, "coord_origin": "TOPLEFT"}, "text": "Understanding", "orig": "Understanding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 160, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 498.649, "r_y0": 105.74000000000001, "r_x1": 545.113, "r_y1": 105.74000000000001, "r_x2": 545.113, "r_y2": 98.043, "r_x3": 498.649, "r_y3": 98.043, "coord_origin": "TOPLEFT"}, "text": "and generat-", "orig": "and generat-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 161, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 116.69899999999996, "r_x1": 440.807, "r_y1": 116.69899999999996, "r_x2": 440.807, "r_y2": 109.00199999999995, "r_x3": 328.781, "r_y3": 109.00199999999995, "coord_origin": "TOPLEFT"}, "text": "ing simple image descriptions.", "orig": "ing simple image descriptions.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 162, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 446.635, "r_y0": 116.57000000000005, "r_x1": 545.113, "r_y1": 116.57000000000005, "r_x2": 545.113, "r_y2": 108.84000000000003, "r_x3": 446.635, "r_y3": 108.84000000000003, "coord_origin": "TOPLEFT"}, "text": "IEEE Transactions on Pat-", "orig": "IEEE Transactions on Pat-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 163, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 127.529, "r_x1": 471.132, "r_y1": 127.529, "r_x2": 471.132, "r_y2": 119.79899999999998, "r_x3": 328.781, "r_y3": 119.79899999999998, "coord_origin": "TOPLEFT"}, "text": "tern Analysis and Machine Intelligence", "orig": "tern Analysis and Machine Intelligence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 164, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 471.133, "r_y0": 127.65800000000002, "r_x1": 473.375, "r_y1": 127.65800000000002, "r_x2": 473.375, "r_y2": 119.96100000000001, "r_x3": 471.133, "r_y3": 119.96100000000001, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 165, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 476.127, "r_y0": 127.65800000000002, "r_x1": 545.115, "r_y1": 127.65800000000002, "r_x2": 545.115, "r_y2": 119.96100000000001, "r_x3": 476.127, "r_y3": 119.96100000000001, "coord_origin": "TOPLEFT"}, "text": "35(12):2891-2903,", "orig": "35(12):2891-2903,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 166, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 138.61699999999996, "r_x1": 356.667, "r_y1": 138.61699999999996, "r_x2": 356.667, "r_y2": 130.91999999999996, "r_x3": 328.781, "r_y3": 130.91999999999996, "coord_origin": "TOPLEFT"}, "text": "2013. 4", "orig": "2013. 4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[16] Girish Kulkarni, Visruth Premraj, Vicente Ordonez, Sagnik Dhar, Siming Li, Yejin Choi, Alexander C. Berg, and Tamara L. Berg. Babytalk: Understanding and generating simple image descriptions. IEEE Transactions on Pattern Analysis and Machine Intelligence , 35(12):2891-2903, 2013. 4"}, {"label": "list_item", "id": 15, "page_no": 8, "cluster": {"id": 15, "label": "list_item", "bbox": {"l": 308.862, "t": 142.36599999999999, "r": 545.113, "b": 171.98000000000002, "coord_origin": "TOPLEFT"}, "confidence": 0.9253129959106445, "cells": [{"index": 167, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 150.063, "r_x1": 323.8, "r_y1": 150.063, "r_x2": 323.8, "r_y2": 142.36599999999999, "r_x3": 308.862, "r_y3": 142.36599999999999, "coord_origin": "TOPLEFT"}, "text": "[17]", "orig": "[17]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 168, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.785, "r_y0": 150.063, "r_x1": 375.698, "r_y1": 150.063, "r_x2": 375.698, "r_y2": 142.36599999999999, "r_x3": 328.785, "r_y3": 142.36599999999999, "coord_origin": "TOPLEFT"}, "text": "Minghao Li,", "orig": "Minghao Li,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 169, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 380.557, "r_y0": 150.063, "r_x1": 392.51, "r_y1": 150.063, "r_x2": 392.51, "r_y2": 142.36599999999999, "r_x3": 380.557, "r_y3": 142.36599999999999, "coord_origin": "TOPLEFT"}, "text": "Lei", "orig": "Lei", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 170, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 396.84, "r_y0": 150.063, "r_x1": 412.038, "r_y1": 150.063, "r_x2": 412.038, "r_y2": 142.36599999999999, "r_x3": 396.84, "r_y3": 142.36599999999999, "coord_origin": "TOPLEFT"}, "text": "Cui,", "orig": "Cui,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 171, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 416.889, "r_y0": 150.063, "r_x1": 478.246, "r_y1": 150.063, "r_x2": 478.246, "r_y2": 142.36599999999999, "r_x3": 416.889, "r_y3": 142.36599999999999, "coord_origin": "TOPLEFT"}, "text": "Shaohan Huang,", "orig": "Shaohan Huang,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 172, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 483.097, "r_y0": 150.063, "r_x1": 500.035, "r_y1": 150.063, "r_x2": 500.035, "r_y2": 142.36599999999999, "r_x3": 483.097, "r_y3": 142.36599999999999, "coord_origin": "TOPLEFT"}, "text": "Furu", "orig": "Furu", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 173, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 504.365, "r_y0": 150.063, "r_x1": 520.828, "r_y1": 150.063, "r_x2": 520.828, "r_y2": 142.36599999999999, "r_x3": 504.365, "r_y3": 142.36599999999999, "coord_origin": "TOPLEFT"}, "text": "Wei,", "orig": "Wei,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 174, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 525.679, "r_y0": 150.063, "r_x1": 545.109, "r_y1": 150.063, "r_x2": 545.109, "r_y2": 142.36599999999999, "r_x3": 525.679, "r_y3": 142.36599999999999, "coord_origin": "TOPLEFT"}, "text": "Ming", "orig": "Ming", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 175, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 161.02099999999996, "r_x1": 414.446, "r_y1": 161.02099999999996, "r_x2": 414.446, "r_y2": 153.32399999999996, "r_x3": 328.781, "r_y3": 153.32399999999996, "coord_origin": "TOPLEFT"}, "text": "Zhou, and Zhoujun Li.", "orig": "Zhou, and Zhoujun Li.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 176, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 421.825, "r_y0": 161.02099999999996, "r_x1": 461.448, "r_y1": 161.02099999999996, "r_x2": 461.448, "r_y2": 153.32399999999996, "r_x3": 421.825, "r_y3": 153.32399999999996, "coord_origin": "TOPLEFT"}, "text": "Tablebank:", "orig": "Tablebank:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 177, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 466.828, "r_y0": 161.02099999999996, "r_x1": 545.113, "r_y1": 161.02099999999996, "r_x2": 545.113, "r_y2": 153.32399999999996, "r_x3": 466.828, "r_y3": 153.32399999999996, "coord_origin": "TOPLEFT"}, "text": "A benchmark dataset", "orig": "A benchmark dataset", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 178, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 171.98000000000002, "r_x1": 493.628, "r_y1": 171.98000000000002, "r_x2": 493.628, "r_y2": 164.28300000000002, "r_x3": 328.781, "r_y3": 164.28300000000002, "coord_origin": "TOPLEFT"}, "text": "for table detection and recognition, 2019. 2, 3", "orig": "for table detection and recognition, 2019. 2, 3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[17] Minghao Li, Lei Cui, Shaohan Huang, Furu Wei, Ming Zhou, and Zhoujun Li. Tablebank: A benchmark dataset for table detection and recognition, 2019. 2, 3"}, {"label": "list_item", "id": 12, "page_no": 8, "cluster": {"id": 12, "label": "list_item", "bbox": {"l": 308.862, "t": 175.72900000000004, "r": 545.113, "b": 260.13800000000003, "coord_origin": "TOPLEFT"}, "confidence": 0.9299732446670532, "cells": [{"index": 179, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 183.42600000000004, "r_x1": 323.8, "r_y1": 183.42600000000004, "r_x2": 323.8, "r_y2": 175.72900000000004, "r_x3": 308.862, "r_y3": 175.72900000000004, "coord_origin": "TOPLEFT"}, "text": "[18]", "orig": "[18]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 180, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.785, "r_y0": 183.42600000000004, "r_x1": 545.109, "r_y1": 183.42600000000004, "r_x2": 545.109, "r_y2": 175.72900000000004, "r_x3": 328.785, "r_y3": 175.72900000000004, "coord_origin": "TOPLEFT"}, "text": "Yiren Li, Zheng Huang, Junchi Yan, Yi Zhou, Fan Ye, and", "orig": "Yiren Li, Zheng Huang, Junchi Yan, Yi Zhou, Fan Ye, and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 181, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 194.385, "r_x1": 375.397, "r_y1": 194.385, "r_x2": 375.397, "r_y2": 186.688, "r_x3": 328.781, "r_y3": 186.688, "coord_origin": "TOPLEFT"}, "text": "Xianhui Liu.", "orig": "Xianhui Liu.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 182, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 381.154, "r_y0": 194.385, "r_x1": 399.58, "r_y1": 194.385, "r_x2": 399.58, "r_y2": 186.688, "r_x3": 381.154, "r_y3": 186.688, "coord_origin": "TOPLEFT"}, "text": "Gfte:", "orig": "Gfte:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 183, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 403.937, "r_y0": 194.385, "r_x1": 545.113, "r_y1": 194.385, "r_x2": 545.113, "r_y2": 186.688, "r_x3": 403.937, "r_y3": 186.688, "coord_origin": "TOPLEFT"}, "text": "Graph-based financial table extraction.", "orig": "Graph-based financial table extraction.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 184, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 205.34400000000005, "r_x1": 545.113, "r_y1": 205.34400000000005, "r_x2": 545.113, "r_y2": 197.64700000000005, "r_x3": 328.781, "r_y3": 197.64700000000005, "coord_origin": "TOPLEFT"}, "text": "In Alberto Del Bimbo, Rita Cucchiara, Stan Sclaroff, Gio-", "orig": "In Alberto Del Bimbo, Rita Cucchiara, Stan Sclaroff, Gio-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 185, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 216.303, "r_x1": 545.113, "r_y1": 216.303, "r_x2": 545.113, "r_y2": 208.606, "r_x3": 328.781, "r_y3": 208.606, "coord_origin": "TOPLEFT"}, "text": "vanni Maria Farinella, Tao Mei, Marco Bertini, Hugo Jair", "orig": "vanni Maria Farinella, Tao Mei, Marco Bertini, Hugo Jair", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 186, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 227.26199999999994, "r_x1": 365.382, "r_y1": 227.26199999999994, "r_x2": 365.382, "r_y2": 219.56500000000005, "r_x3": 328.781, "r_y3": 219.56500000000005, "coord_origin": "TOPLEFT"}, "text": "Escalante,", "orig": "Escalante,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 187, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 369.237, "r_y0": 227.26199999999994, "r_x1": 479.264, "r_y1": 227.26199999999994, "r_x2": 479.264, "r_y2": 219.56500000000005, "r_x3": 369.237, "r_y3": 219.56500000000005, "coord_origin": "TOPLEFT"}, "text": "and Roberto Vezzani, editors,", "orig": "and Roberto Vezzani, editors,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 188, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 483.119, "r_y0": 227.13300000000004, "r_x1": 545.113, "r_y1": 227.13300000000004, "r_x2": 545.113, "r_y2": 219.40300000000002, "r_x3": 483.119, "r_y3": 219.40300000000002, "coord_origin": "TOPLEFT"}, "text": "Pattern Recogni-", "orig": "Pattern Recogni-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 189, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 238.091, "r_x1": 519.398, "r_y1": 238.091, "r_x2": 519.398, "r_y2": 230.361, "r_x3": 328.781, "r_y3": 230.361, "coord_origin": "TOPLEFT"}, "text": "tion. ICPR International Workshops and Challenges", "orig": "tion. ICPR International Workshops and Challenges", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 190, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 519.401, "r_y0": 238.22000000000003, "r_x1": 521.643, "r_y1": 238.22000000000003, "r_x2": 521.643, "r_y2": 230.52300000000002, "r_x3": 519.401, "r_y3": 230.52300000000002, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 191, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 524.691, "r_y0": 238.22000000000003, "r_x1": 545.108, "r_y1": 238.22000000000003, "r_x2": 545.108, "r_y2": 230.52300000000002, "r_x3": 524.691, "r_y3": 230.52300000000002, "coord_origin": "TOPLEFT"}, "text": "pages", "orig": "pages", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 192, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 249.17899999999997, "r_x1": 545.113, "r_y1": 249.17899999999997, "r_x2": 545.113, "r_y2": 241.48199999999997, "r_x3": 328.781, "r_y3": 241.48199999999997, "coord_origin": "TOPLEFT"}, "text": "644-658, Cham, 2021. Springer International Publishing. 2,", "orig": "644-658, Cham, 2021. Springer International Publishing. 2,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 193, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 260.13800000000003, "r_x1": 333.264, "r_y1": 260.13800000000003, "r_x2": 333.264, "r_y2": 252.44100000000003, "r_x3": 328.781, "r_y3": 252.44100000000003, "coord_origin": "TOPLEFT"}, "text": "3", "orig": "3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[18] Yiren Li, Zheng Huang, Junchi Yan, Yi Zhou, Fan Ye, and Xianhui Liu. Gfte: Graph-based financial table extraction. In Alberto Del Bimbo, Rita Cucchiara, Stan Sclaroff, Giovanni Maria Farinella, Tao Mei, Marco Bertini, Hugo Jair Escalante, and Roberto Vezzani, editors, Pattern Recognition. ICPR International Workshops and Challenges , pages 644-658, Cham, 2021. Springer International Publishing. 2, 3"}, {"label": "list_item", "id": 8, "page_no": 8, "cluster": {"id": 8, "label": "list_item", "bbox": {"l": 308.862, "t": 263.88699999999994, "r": 545.114, "b": 326.378, "coord_origin": "TOPLEFT"}, "confidence": 0.937321662902832, "cells": [{"index": 194, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 271.58399999999995, "r_x1": 323.8, "r_y1": 271.58399999999995, "r_x2": 323.8, "r_y2": 263.88699999999994, "r_x3": 308.862, "r_y3": 263.88699999999994, "coord_origin": "TOPLEFT"}, "text": "[19]", "orig": "[19]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 195, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.785, "r_y0": 271.58399999999995, "r_x1": 545.109, "r_y1": 271.58399999999995, "r_x2": 545.109, "r_y2": 263.88699999999994, "r_x3": 328.785, "r_y3": 263.88699999999994, "coord_origin": "TOPLEFT"}, "text": "Nikolaos Livathinos, Cesar Berrospi, Maksym Lysak, Vik-", "orig": "Nikolaos Livathinos, Cesar Berrospi, Maksym Lysak, Vik-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 196, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 282.543, "r_x1": 545.113, "r_y1": 282.543, "r_x2": 545.113, "r_y2": 274.846, "r_x3": 328.781, "r_y3": 274.846, "coord_origin": "TOPLEFT"}, "text": "tor Kuropiatnyk, Ahmed Nassar, Andre Carvalho, Michele", "orig": "tor Kuropiatnyk, Ahmed Nassar, Andre Carvalho, Michele", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 197, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 293.502, "r_x1": 527.118, "r_y1": 293.502, "r_x2": 527.118, "r_y2": 285.805, "r_x3": 328.781, "r_y3": 285.805, "coord_origin": "TOPLEFT"}, "text": "Dolfi, Christoph Auer, Kasper Dinkla, and Peter Staar.", "orig": "Dolfi, Christoph Auer, Kasper Dinkla, and Peter Staar.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 198, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 531.664, "r_y0": 293.502, "r_x1": 545.113, "r_y1": 293.502, "r_x2": 545.113, "r_y2": 285.805, "r_x3": 531.664, "r_y3": 285.805, "coord_origin": "TOPLEFT"}, "text": "Ro-", "orig": "Ro-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 199, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 304.461, "r_x1": 343.549, "r_y1": 304.461, "r_x2": 343.549, "r_y2": 296.764, "r_x3": 328.781, "r_y3": 296.764, "coord_origin": "TOPLEFT"}, "text": "bust", "orig": "bust", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 200, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 347.44, "r_y0": 304.461, "r_x1": 545.113, "r_y1": 304.461, "r_x2": 545.113, "r_y2": 296.764, "r_x3": 347.44, "r_y3": 296.764, "coord_origin": "TOPLEFT"}, "text": "pdf document conversion using recurrent neural net-", "orig": "pdf document conversion using recurrent neural net-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 201, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 315.419, "r_x1": 352.847, "r_y1": 315.419, "r_x2": 352.847, "r_y2": 307.722, "r_x3": 328.781, "r_y3": 307.722, "coord_origin": "TOPLEFT"}, "text": "works.", "orig": "works.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 202, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 360.236, "r_y0": 315.29, "r_x1": 545.114, "r_y1": 315.29, "r_x2": 545.114, "r_y2": 307.56, "r_x3": 360.236, "r_y3": 307.56, "coord_origin": "TOPLEFT"}, "text": "Proceedings of the AAAI Conference on Artificial", "orig": "Proceedings of the AAAI Conference on Artificial", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 203, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 326.249, "r_x1": 371.022, "r_y1": 326.249, "r_x2": 371.022, "r_y2": 318.519, "r_x3": 328.781, "r_y3": 318.519, "coord_origin": "TOPLEFT"}, "text": "Intelligence", "orig": "Intelligence", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 204, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 371.021, "r_y0": 326.378, "r_x1": 502.262, "r_y1": 326.378, "r_x2": 502.262, "r_y2": 318.681, "r_x3": 371.021, "r_y3": 318.681, "coord_origin": "TOPLEFT"}, "text": ", 35(17):15137-15145, May 2021. 1", "orig": ", 35(17):15137-15145, May 2021. 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[19] Nikolaos Livathinos, Cesar Berrospi, Maksym Lysak, Viktor Kuropiatnyk, Ahmed Nassar, Andre Carvalho, Michele Dolfi, Christoph Auer, Kasper Dinkla, and Peter Staar. Robust pdf document conversion using recurrent neural networks. Proceedings of the AAAI Conference on Artificial Intelligence , 35(17):15137-15145, May 2021. 1"}, {"label": "list_item", "id": 18, "page_no": 8, "cluster": {"id": 18, "label": "list_item", "bbox": {"l": 308.862, "t": 330.127, "r": 545.116, "b": 370.701, "coord_origin": "TOPLEFT"}, "confidence": 0.9027292728424072, "cells": [{"index": 205, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 337.824, "r_x1": 323.8, "r_y1": 337.824, "r_x2": 323.8, "r_y2": 330.127, "r_x3": 308.862, "r_y3": 330.127, "coord_origin": "TOPLEFT"}, "text": "[20]", "orig": "[20]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 206, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.785, "r_y0": 337.824, "r_x1": 545.109, "r_y1": 337.824, "r_x2": 545.109, "r_y2": 330.127, "r_x3": 328.785, "r_y3": 330.127, "coord_origin": "TOPLEFT"}, "text": "Rujiao Long, Wen Wang, Nan Xue, Feiyu Gao, Zhibo Yang,", "orig": "Rujiao Long, Wen Wang, Nan Xue, Feiyu Gao, Zhibo Yang,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 207, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 348.783, "r_x1": 456.821, "r_y1": 348.783, "r_x2": 456.821, "r_y2": 341.086, "r_x3": 328.781, "r_y3": 341.086, "coord_origin": "TOPLEFT"}, "text": "Yongpan Wang, and Gui-Song Xia.", "orig": "Yongpan Wang, and Gui-Song Xia.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 208, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 460.991, "r_y0": 348.783, "r_x1": 545.113, "r_y1": 348.783, "r_x2": 545.113, "r_y2": 341.086, "r_x3": 460.991, "r_y3": 341.086, "coord_origin": "TOPLEFT"}, "text": "Parsing table structures", "orig": "Parsing table structures", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 209, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 359.742, "r_x1": 370.421, "r_y1": 359.742, "r_x2": 370.421, "r_y2": 352.045, "r_x3": 328.781, "r_y3": 352.045, "coord_origin": "TOPLEFT"}, "text": "in the wild.", "orig": "in the wild.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 210, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 375.308, "r_y0": 359.742, "r_x1": 382.777, "r_y1": 359.742, "r_x2": 382.777, "r_y2": 352.045, "r_x3": 375.308, "r_y3": 352.045, "coord_origin": "TOPLEFT"}, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 211, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 385.541, "r_y0": 359.613, "r_x1": 545.116, "r_y1": 359.613, "r_x2": 545.116, "r_y2": 351.883, "r_x3": 385.541, "r_y3": 351.883, "coord_origin": "TOPLEFT"}, "text": "Proceedings of the IEEE/CVF International", "orig": "Proceedings of the IEEE/CVF International", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 212, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 370.572, "r_x1": 443.596, "r_y1": 370.572, "r_x2": 443.596, "r_y2": 362.842, "r_x3": 328.781, "r_y3": 362.842, "coord_origin": "TOPLEFT"}, "text": "Conference on Computer Vision", "orig": "Conference on Computer Vision", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 213, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 443.594, "r_y0": 370.701, "r_x1": 534.486, "r_y1": 370.701, "r_x2": 534.486, "r_y2": 363.004, "r_x3": 443.594, "r_y3": 363.004, "coord_origin": "TOPLEFT"}, "text": ", pages 944-952, 2021. 2", "orig": ", pages 944-952, 2021. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[20] Rujiao Long, Wen Wang, Nan Xue, Feiyu Gao, Zhibo Yang, Yongpan Wang, and Gui-Song Xia. Parsing table structures in the wild. In Proceedings of the IEEE/CVF International Conference on Computer Vision , pages 944-952, 2021. 2"}, {"label": "list_item", "id": 21, "page_no": 8, "cluster": {"id": 21, "label": "list_item", "bbox": {"l": 308.862, "t": 374.449, "r": 545.113, "b": 436.941, "coord_origin": "TOPLEFT"}, "confidence": 0.882714569568634, "cells": [{"index": 214, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 382.146, "r_x1": 323.8, "r_y1": 382.146, "r_x2": 323.8, "r_y2": 374.449, "r_x3": 308.862, "r_y3": 374.449, "coord_origin": "TOPLEFT"}, "text": "[21]", "orig": "[21]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 215, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.785, "r_y0": 382.146, "r_x1": 362.66, "r_y1": 382.146, "r_x2": 362.66, "r_y2": 374.449, "r_x3": 328.785, "r_y3": 374.449, "coord_origin": "TOPLEFT"}, "text": "Shubham", "orig": "Shubham", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 216, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 368.695, "r_y0": 382.146, "r_x1": 389.613, "r_y1": 382.146, "r_x2": 389.613, "r_y2": 374.449, "r_x3": 368.695, "r_y3": 374.449, "coord_origin": "TOPLEFT"}, "text": "Singh", "orig": "Singh", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 217, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 395.648, "r_y0": 382.146, "r_x1": 424.564, "r_y1": 382.146, "r_x2": 424.564, "r_y2": 374.449, "r_x3": 395.648, "r_y3": 374.449, "coord_origin": "TOPLEFT"}, "text": "Paliwal,", "orig": "Paliwal,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 218, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 431.549, "r_y0": 382.146, "r_x1": 488.504, "r_y1": 382.146, "r_x2": 488.504, "r_y2": 374.449, "r_x3": 431.549, "r_y3": 374.449, "coord_origin": "TOPLEFT"}, "text": "D Vishwanath,", "orig": "D Vishwanath,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 219, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 495.48, "r_y0": 382.146, "r_x1": 515.412, "r_y1": 382.146, "r_x2": 515.412, "r_y2": 374.449, "r_x3": 495.48, "r_y3": 374.449, "coord_origin": "TOPLEFT"}, "text": "Rohit", "orig": "Rohit", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 220, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 521.446, "r_y0": 382.146, "r_x1": 545.109, "r_y1": 382.146, "r_x2": 545.109, "r_y2": 374.449, "r_x3": 521.446, "r_y3": 374.449, "coord_origin": "TOPLEFT"}, "text": "Rahul,", "orig": "Rahul,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 221, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 393.105, "r_x1": 460.318, "r_y1": 393.105, "r_x2": 460.318, "r_y2": 385.408, "r_x3": 328.781, "r_y3": 385.408, "coord_origin": "TOPLEFT"}, "text": "Monika Sharma, and Lovekesh Vig.", "orig": "Monika Sharma, and Lovekesh Vig.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 222, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 465.393, "r_y0": 393.105, "r_x1": 498.542, "r_y1": 393.105, "r_x2": 498.542, "r_y2": 385.408, "r_x3": 465.393, "r_y3": 385.408, "coord_origin": "TOPLEFT"}, "text": "Tablenet:", "orig": "Tablenet:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 223, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 502.469, "r_y0": 393.105, "r_x1": 545.113, "r_y1": 393.105, "r_x2": 545.113, "r_y2": 385.408, "r_x3": 502.469, "r_y3": 385.408, "coord_origin": "TOPLEFT"}, "text": "Deep learn-", "orig": "Deep learn-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 224, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 404.064, "r_x1": 545.113, "r_y1": 404.064, "r_x2": 545.113, "r_y2": 396.367, "r_x3": 328.781, "r_y3": 396.367, "coord_origin": "TOPLEFT"}, "text": "ing model for end-to-end table detection and tabular data ex-", "orig": "ing model for end-to-end table detection and tabular data ex-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 225, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 415.023, "r_x1": 478.009, "r_y1": 415.023, "r_x2": 478.009, "r_y2": 407.326, "r_x3": 328.781, "r_y3": 407.326, "coord_origin": "TOPLEFT"}, "text": "traction from scanned document images.", "orig": "traction from scanned document images.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 226, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 484.07, "r_y0": 415.023, "r_x1": 491.539, "r_y1": 415.023, "r_x2": 491.539, "r_y2": 407.326, "r_x3": 484.07, "r_y3": 407.326, "coord_origin": "TOPLEFT"}, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 227, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 494.668, "r_y0": 414.894, "r_x1": 545.113, "r_y1": 414.894, "r_x2": 545.113, "r_y2": 407.164, "r_x3": 494.668, "r_y3": 407.164, "coord_origin": "TOPLEFT"}, "text": "2019 Interna-", "orig": "2019 Interna-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 228, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 425.853, "r_x1": 349.709, "r_y1": 425.853, "r_x2": 349.709, "r_y2": 418.123, "r_x3": 328.781, "r_y3": 418.123, "coord_origin": "TOPLEFT"}, "text": "tional", "orig": "tional", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 229, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 353.295, "r_y0": 425.853, "r_x1": 545.113, "r_y1": 425.853, "r_x2": 545.113, "r_y2": 418.123, "r_x3": 353.295, "r_y3": 418.123, "coord_origin": "TOPLEFT"}, "text": "Conference on Document Analysis and Recognition", "orig": "Conference on Document Analysis and Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 230, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 436.812, "r_x1": 360.836, "r_y1": 436.812, "r_x2": 360.836, "r_y2": 429.082, "r_x3": 328.781, "r_y3": 429.082, "coord_origin": "TOPLEFT"}, "text": "(ICDAR)", "orig": "(ICDAR)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 231, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 360.836, "r_y0": 436.941, "r_x1": 475.633, "r_y1": 436.941, "r_x2": 475.633, "r_y2": 429.244, "r_x3": 360.836, "r_y3": 429.244, "coord_origin": "TOPLEFT"}, "text": ", pages 128-133. IEEE, 2019. 1", "orig": ", pages 128-133. IEEE, 2019. 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[21] Shubham Singh Paliwal, D Vishwanath, Rohit Rahul, Monika Sharma, and Lovekesh Vig. Tablenet: Deep learning model for end-to-end table detection and tabular data extraction from scanned document images. In 2019 International Conference on Document Analysis and Recognition (ICDAR) , pages 128-133. IEEE, 2019. 1"}, {"label": "list_item", "id": 20, "page_no": 8, "cluster": {"id": 20, "label": "list_item", "bbox": {"l": 308.862, "t": 440.689, "r": 545.115, "b": 557.975, "coord_origin": "TOPLEFT"}, "confidence": 0.8896440863609314, "cells": [{"index": 232, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 448.386, "r_x1": 323.8, "r_y1": 448.386, "r_x2": 323.8, "r_y2": 440.689, "r_x3": 308.862, "r_y3": 440.689, "coord_origin": "TOPLEFT"}, "text": "[22]", "orig": "[22]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 233, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.785, "r_y0": 448.386, "r_x1": 545.109, "r_y1": 448.386, "r_x2": 545.109, "r_y2": 440.689, "r_x3": 328.785, "r_y3": 440.689, "coord_origin": "TOPLEFT"}, "text": "Adam Paszke, Sam Gross, Francisco Massa, Adam Lerer,", "orig": "Adam Paszke, Sam Gross, Francisco Massa, Adam Lerer,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 234, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 459.345, "r_x1": 545.113, "r_y1": 459.345, "r_x2": 545.113, "r_y2": 451.648, "r_x3": 328.781, "r_y3": 451.648, "coord_origin": "TOPLEFT"}, "text": "James Bradbury, Gregory Chanan, Trevor Killeen, Zeming", "orig": "James Bradbury, Gregory Chanan, Trevor Killeen, Zeming", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 235, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 470.304, "r_x1": 343.477, "r_y1": 470.304, "r_x2": 343.477, "r_y2": 462.607, "r_x3": 328.781, "r_y3": 462.607, "coord_origin": "TOPLEFT"}, "text": "Lin,", "orig": "Lin,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 236, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 347.601, "r_y0": 470.304, "r_x1": 373.496, "r_y1": 470.304, "r_x2": 373.496, "r_y2": 462.607, "r_x3": 347.601, "r_y3": 462.607, "coord_origin": "TOPLEFT"}, "text": "Natalia", "orig": "Natalia", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 237, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 377.244, "r_y0": 470.304, "r_x1": 420.83, "r_y1": 470.304, "r_x2": 420.83, "r_y2": 462.607, "r_x3": 377.244, "r_y3": 462.607, "coord_origin": "TOPLEFT"}, "text": "Gimelshein,", "orig": "Gimelshein,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 238, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 424.955, "r_y0": 470.304, "r_x1": 473.239, "r_y1": 470.304, "r_x2": 473.239, "r_y2": 462.607, "r_x3": 424.955, "r_y3": 462.607, "coord_origin": "TOPLEFT"}, "text": "Luca Antiga,", "orig": "Luca Antiga,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 239, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 477.363, "r_y0": 470.304, "r_x1": 545.113, "r_y1": 470.304, "r_x2": 545.113, "r_y2": 462.607, "r_x3": 477.363, "r_y3": 462.607, "coord_origin": "TOPLEFT"}, "text": "Alban Desmaison,", "orig": "Alban Desmaison,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 240, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 481.263, "r_x1": 545.113, "r_y1": 481.263, "r_x2": 545.113, "r_y2": 473.566, "r_x3": 328.781, "r_y3": 473.566, "coord_origin": "TOPLEFT"}, "text": "Andreas Kopf, Edward Yang, Zachary DeVito, Martin Rai-", "orig": "Andreas Kopf, Edward Yang, Zachary DeVito, Martin Rai-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 241, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 492.222, "r_x1": 545.113, "r_y1": 492.222, "r_x2": 545.113, "r_y2": 484.525, "r_x3": 328.781, "r_y3": 484.525, "coord_origin": "TOPLEFT"}, "text": "son, Alykhan Tejani, Sasank Chilamkurthy, Benoit Steiner,", "orig": "son, Alykhan Tejani, Sasank Chilamkurthy, Benoit Steiner,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 242, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 503.181, "r_x1": 545.113, "r_y1": 503.181, "r_x2": 545.113, "r_y2": 495.484, "r_x3": 328.781, "r_y3": 495.484, "coord_origin": "TOPLEFT"}, "text": "Lu Fang, Junjie Bai, and Soumith Chintala. Pytorch: An im-", "orig": "Lu Fang, Junjie Bai, and Soumith Chintala. Pytorch: An im-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 243, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 514.14, "r_x1": 545.113, "r_y1": 514.14, "r_x2": 545.113, "r_y2": 506.443, "r_x3": 328.781, "r_y3": 506.443, "coord_origin": "TOPLEFT"}, "text": "perative style, high-performance deep learning library. In H.", "orig": "perative style, high-performance deep learning library. In H.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 244, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 525.0989999999999, "r_x1": 545.11, "r_y1": 525.0989999999999, "r_x2": 545.11, "r_y2": 517.402, "r_x3": 328.781, "r_y3": 517.402, "coord_origin": "TOPLEFT"}, "text": "Wallach, H. Larochelle, A. Beygelzimer, F. d'Alch\u00b4-Buc, E.", "orig": "Wallach, H. Larochelle, A. Beygelzimer, F. d'Alch\u00b4-Buc, E.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 245, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 511.145, "r_y0": 525.0989999999999, "r_x1": 515.126, "r_y1": 525.0989999999999, "r_x2": 515.126, "r_y2": 517.402, "r_x3": 511.145, "r_y3": 517.402, "coord_origin": "TOPLEFT"}, "text": "e", "orig": "e", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 246, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 536.057, "r_x1": 434.567, "r_y1": 536.057, "r_x2": 434.567, "r_y2": 528.36, "r_x3": 328.781, "r_y3": 528.36, "coord_origin": "TOPLEFT"}, "text": "Fox, and R. Garnett, editors,", "orig": "Fox, and R. Garnett, editors,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 247, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 437.864, "r_y0": 535.928, "r_x1": 545.111, "r_y1": 535.928, "r_x2": 545.111, "r_y2": 528.198, "r_x3": 437.864, "r_y3": 528.198, "coord_origin": "TOPLEFT"}, "text": "Advances in Neural Informa-", "orig": "Advances in Neural Informa-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 248, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 546.887, "r_x1": 425.735, "r_y1": 546.887, "r_x2": 425.735, "r_y2": 539.157, "r_x3": 328.781, "r_y3": 539.157, "coord_origin": "TOPLEFT"}, "text": "tion Processing Systems 32", "orig": "tion Processing Systems 32", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 249, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 425.736, "r_y0": 547.016, "r_x1": 545.115, "r_y1": 547.016, "r_x2": 545.115, "r_y2": 539.319, "r_x3": 425.736, "r_y3": 539.319, "coord_origin": "TOPLEFT"}, "text": ", pages 8024-8035. Curran Asso-", "orig": ", pages 8024-8035. Curran Asso-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 250, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 557.975, "r_x1": 399.741, "r_y1": 557.975, "r_x2": 399.741, "r_y2": 550.278, "r_x3": 328.781, "r_y3": 550.278, "coord_origin": "TOPLEFT"}, "text": "ciates, Inc., 2019. 6", "orig": "ciates, Inc., 2019. 6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[22] Adam Paszke, Sam Gross, Francisco Massa, Adam Lerer, James Bradbury, Gregory Chanan, Trevor Killeen, Zeming Lin, Natalia Gimelshein, Luca Antiga, Alban Desmaison, Andreas Kopf, Edward Yang, Zachary DeVito, Martin Raison, Alykhan Tejani, Sasank Chilamkurthy, Benoit Steiner, Lu Fang, Junjie Bai, and Soumith Chintala. Pytorch: An imperative style, high-performance deep learning library. In H. Wallach, H. Larochelle, A. Beygelzimer, F. d'Alch\u00b4-Buc, E. e Fox, and R. Garnett, editors, Advances in Neural Information Processing Systems 32 , pages 8024-8035. Curran Associates, Inc., 2019. 6"}, {"label": "list_item", "id": 19, "page_no": 8, "cluster": {"id": 19, "label": "list_item", "bbox": {"l": 308.862, "t": 561.7239999999999, "r": 545.113, "b": 624.215, "coord_origin": "TOPLEFT"}, "confidence": 0.9025435447692871, "cells": [{"index": 251, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 569.421, "r_x1": 323.8, "r_y1": 569.421, "r_x2": 323.8, "r_y2": 561.7239999999999, "r_x3": 308.862, "r_y3": 561.7239999999999, "coord_origin": "TOPLEFT"}, "text": "[23]", "orig": "[23]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 252, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.785, "r_y0": 569.421, "r_x1": 395.433, "r_y1": 569.421, "r_x2": 395.433, "r_y2": 561.7239999999999, "r_x3": 328.785, "r_y3": 561.7239999999999, "coord_origin": "TOPLEFT"}, "text": "Devashish Prasad,", "orig": "Devashish Prasad,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 253, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 399.369, "r_y0": 569.421, "r_x1": 545.109, "r_y1": 569.421, "r_x2": 545.109, "r_y2": 561.7239999999999, "r_x3": 399.369, "r_y3": 561.7239999999999, "coord_origin": "TOPLEFT"}, "text": "Ayan Gadpal, Kshitij Kapadni, Manish", "orig": "Ayan Gadpal, Kshitij Kapadni, Manish", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 254, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 580.38, "r_x1": 545.113, "r_y1": 580.38, "r_x2": 545.113, "r_y2": 572.683, "r_x3": 328.781, "r_y3": 572.683, "coord_origin": "TOPLEFT"}, "text": "Visave, and Kavita Sultanpure. Cascadetabnet: An approach", "orig": "Visave, and Kavita Sultanpure. Cascadetabnet: An approach", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 255, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 591.3389999999999, "r_x1": 545.113, "r_y1": 591.3389999999999, "r_x2": 545.113, "r_y2": 583.642, "r_x3": 328.781, "r_y3": 583.642, "coord_origin": "TOPLEFT"}, "text": "for end to end table detection and structure recognition from", "orig": "for end to end table detection and structure recognition from", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 256, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 602.298, "r_x1": 418.266, "r_y1": 602.298, "r_x2": 418.266, "r_y2": 594.601, "r_x3": 328.781, "r_y3": 594.601, "coord_origin": "TOPLEFT"}, "text": "image-based documents.", "orig": "image-based documents.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 257, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 424.148, "r_y0": 602.298, "r_x1": 431.617, "r_y1": 602.298, "r_x2": 431.617, "r_y2": 594.601, "r_x3": 424.148, "r_y3": 594.601, "coord_origin": "TOPLEFT"}, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 258, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 434.691, "r_y0": 602.169, "r_x1": 545.112, "r_y1": 602.169, "r_x2": 545.112, "r_y2": 594.439, "r_x3": 434.691, "r_y3": 594.439, "coord_origin": "TOPLEFT"}, "text": "Proceedings of the IEEE/CVF", "orig": "Proceedings of the IEEE/CVF", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 259, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 613.127, "r_x1": 369.784, "r_y1": 613.127, "r_x2": 369.784, "r_y2": 605.3969999999999, "r_x3": 328.781, "r_y3": 605.3969999999999, "coord_origin": "TOPLEFT"}, "text": "Conference", "orig": "Conference", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 260, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 374.008, "r_y0": 613.127, "r_x1": 449.549, "r_y1": 613.127, "r_x2": 449.549, "r_y2": 605.3969999999999, "r_x3": 374.008, "r_y3": 605.3969999999999, "coord_origin": "TOPLEFT"}, "text": "on Computer Vision", "orig": "on Computer Vision", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 261, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 453.782, "r_y0": 613.127, "r_x1": 497.636, "r_y1": 613.127, "r_x2": 497.636, "r_y2": 605.3969999999999, "r_x3": 453.782, "r_y3": 605.3969999999999, "coord_origin": "TOPLEFT"}, "text": "and Pattern", "orig": "and Pattern", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 262, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 501.868, "r_y0": 613.127, "r_x1": 545.113, "r_y1": 613.127, "r_x2": 545.113, "r_y2": 605.3969999999999, "r_x3": 501.868, "r_y3": 605.3969999999999, "coord_origin": "TOPLEFT"}, "text": "Recognition", "orig": "Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 263, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 624.086, "r_x1": 367.803, "r_y1": 624.086, "r_x2": 367.803, "r_y2": 616.356, "r_x3": 328.781, "r_y3": 616.356, "coord_origin": "TOPLEFT"}, "text": "Workshops", "orig": "Workshops", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 264, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 367.802, "r_y0": 624.215, "r_x1": 458.694, "r_y1": 624.215, "r_x2": 458.694, "r_y2": 616.518, "r_x3": 367.802, "r_y3": 616.518, "coord_origin": "TOPLEFT"}, "text": ", pages 572-573, 2020. 1", "orig": ", pages 572-573, 2020. 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[23] Devashish Prasad, Ayan Gadpal, Kshitij Kapadni, Manish Visave, and Kavita Sultanpure. Cascadetabnet: An approach for end to end table detection and structure recognition from image-based documents. In Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition Workshops , pages 572-573, 2020. 1"}, {"label": "list_item", "id": 23, "page_no": 8, "cluster": {"id": 23, "label": "list_item", "bbox": {"l": 308.862, "t": 627.9639999999999, "r": 545.116, "b": 668.538, "coord_origin": "TOPLEFT"}, "confidence": 0.8777532577514648, "cells": [{"index": 265, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 635.6610000000001, "r_x1": 323.8, "r_y1": 635.6610000000001, "r_x2": 323.8, "r_y2": 627.9639999999999, "r_x3": 308.862, "r_y3": 627.9639999999999, "coord_origin": "TOPLEFT"}, "text": "[24]", "orig": "[24]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 266, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.785, "r_y0": 635.6610000000001, "r_x1": 545.109, "r_y1": 635.6610000000001, "r_x2": 545.109, "r_y2": 627.9639999999999, "r_x3": 328.785, "r_y3": 627.9639999999999, "coord_origin": "TOPLEFT"}, "text": "Shah Rukh Qasim, Hassan Mahmood, and Faisal Shafait.", "orig": "Shah Rukh Qasim, Hassan Mahmood, and Faisal Shafait.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 267, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 646.62, "r_x1": 545.113, "r_y1": 646.62, "r_x2": 545.113, "r_y2": 638.923, "r_x3": 328.781, "r_y3": 638.923, "coord_origin": "TOPLEFT"}, "text": "Rethinking table recognition using graph neural networks.", "orig": "Rethinking table recognition using graph neural networks.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 268, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 657.579, "r_x1": 336.25, "r_y1": 657.579, "r_x2": 336.25, "r_y2": 649.8820000000001, "r_x3": 328.781, "r_y3": 649.8820000000001, "coord_origin": "TOPLEFT"}, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 269, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 338.1, "r_y0": 657.45, "r_x1": 545.116, "r_y1": 657.45, "r_x2": 545.116, "r_y2": 649.72, "r_x3": 338.1, "r_y3": 649.72, "coord_origin": "TOPLEFT"}, "text": "2019 International Conference on Document Analysis and", "orig": "2019 International Conference on Document Analysis and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 270, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 668.409, "r_x1": 406.322, "r_y1": 668.409, "r_x2": 406.322, "r_y2": 660.679, "r_x3": 328.781, "r_y3": 660.679, "coord_origin": "TOPLEFT"}, "text": "Recognition (ICDAR)", "orig": "Recognition (ICDAR)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 271, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 406.322, "r_y0": 668.538, "r_x1": 521.119, "r_y1": 668.538, "r_x2": 521.119, "r_y2": 660.841, "r_x3": 406.322, "r_y3": 660.841, "coord_origin": "TOPLEFT"}, "text": ", pages 142-147. IEEE, 2019. 3", "orig": ", pages 142-147. IEEE, 2019. 3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[24] Shah Rukh Qasim, Hassan Mahmood, and Faisal Shafait. Rethinking table recognition using graph neural networks. In 2019 International Conference on Document Analysis and Recognition (ICDAR) , pages 142-147. IEEE, 2019. 3"}, {"label": "list_item", "id": 24, "page_no": 8, "cluster": {"id": 24, "label": "list_item", "bbox": {"l": 308.862, "t": 672.2860000000001, "r": 545.113, "b": 712.86, "coord_origin": "TOPLEFT"}, "confidence": 0.8654531240463257, "cells": [{"index": 272, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 679.983, "r_x1": 323.8, "r_y1": 679.983, "r_x2": 323.8, "r_y2": 672.2860000000001, "r_x3": 308.862, "r_y3": 672.2860000000001, "coord_origin": "TOPLEFT"}, "text": "[25]", "orig": "[25]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 273, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.785, "r_y0": 679.983, "r_x1": 400.857, "r_y1": 679.983, "r_x2": 400.857, "r_y2": 672.2860000000001, "r_x3": 328.785, "r_y3": 672.2860000000001, "coord_origin": "TOPLEFT"}, "text": "Hamid Rezatofighi,", "orig": "Hamid Rezatofighi,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 274, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 405.403, "r_y0": 679.983, "r_x1": 453.571, "r_y1": 679.983, "r_x2": 453.571, "r_y2": 672.2860000000001, "r_x3": 405.403, "r_y3": 672.2860000000001, "coord_origin": "TOPLEFT"}, "text": "Nathan Tsoi,", "orig": "Nathan Tsoi,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 275, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 458.117, "r_y0": 679.983, "r_x1": 521.635, "r_y1": 679.983, "r_x2": 521.635, "r_y2": 672.2860000000001, "r_x3": 458.117, "r_y3": 672.2860000000001, "coord_origin": "TOPLEFT"}, "text": "JunYoung Gwak,", "orig": "JunYoung Gwak,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 276, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 526.181, "r_y0": 679.983, "r_x1": 545.109, "r_y1": 679.983, "r_x2": 545.109, "r_y2": 672.2860000000001, "r_x3": 526.181, "r_y3": 672.2860000000001, "coord_origin": "TOPLEFT"}, "text": "Amir", "orig": "Amir", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 277, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 690.942, "r_x1": 482.815, "r_y1": 690.942, "r_x2": 482.815, "r_y2": 683.245, "r_x3": 328.781, "r_y3": 683.245, "coord_origin": "TOPLEFT"}, "text": "Sadeghian, Ian Reid, and Silvio Savarese.", "orig": "Sadeghian, Ian Reid, and Silvio Savarese.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 278, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 488.751, "r_y0": 690.942, "r_x1": 545.113, "r_y1": 690.942, "r_x2": 545.113, "r_y2": 683.245, "r_x3": 488.751, "r_y3": 683.245, "coord_origin": "TOPLEFT"}, "text": "Generalized in-", "orig": "Generalized in-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 279, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 701.901, "r_x1": 545.113, "r_y1": 701.901, "r_x2": 545.113, "r_y2": 694.204, "r_x3": 328.781, "r_y3": 694.204, "coord_origin": "TOPLEFT"}, "text": "tersection over union: A metric and a loss for bounding box", "orig": "tersection over union: A metric and a loss for bounding box", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 280, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 712.86, "r_x1": 367.74, "r_y1": 712.86, "r_x2": 367.74, "r_y2": 705.163, "r_x3": 328.781, "r_y3": 705.163, "coord_origin": "TOPLEFT"}, "text": "regression.", "orig": "regression.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 281, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 371.685, "r_y0": 712.86, "r_x1": 379.154, "r_y1": 712.86, "r_x2": 379.154, "r_y2": 705.163, "r_x3": 371.685, "r_y3": 705.163, "coord_origin": "TOPLEFT"}, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 282, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 381.616, "r_y0": 712.731, "r_x1": 545.109, "r_y1": 712.731, "r_x2": 545.109, "r_y2": 705.001, "r_x3": 381.616, "r_y3": 705.001, "coord_origin": "TOPLEFT"}, "text": "Proceedings of the IEEE/CVF Conference on", "orig": "Proceedings of the IEEE/CVF Conference on", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[25] Hamid Rezatofighi, Nathan Tsoi, JunYoung Gwak, Amir Sadeghian, Ian Reid, and Silvio Savarese. Generalized intersection over union: A metric and a loss for bounding box regression. In Proceedings of the IEEE/CVF Conference on"}], "headers": [{"label": "page_footer", "id": 22, "page_no": 8, "cluster": {"id": 22, "label": "page_footer", "bbox": {"l": 295.121, "t": 734.402, "r": 300.102, "b": 742.954, "coord_origin": "TOPLEFT"}, "confidence": 0.8797808885574341, "cells": [{"index": 283, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 295.121, "r_y0": 742.954, "r_x1": 300.102, "r_y1": 742.954, "r_x2": 300.102, "r_y2": 734.402, "r_x3": 295.121, "r_y3": 734.402, "coord_origin": "TOPLEFT"}, "text": "9", "orig": "9", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "9"}]}}, {"page_no": 9, "size": {"width": 612.0, "height": 792.0}, "cells": [{"index": 0, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 83.69399999999996, "r_x1": 223.581, "r_y1": 83.69399999999996, "r_x2": 223.581, "r_y2": 75.96400000000006, "r_x3": 70.031, "r_y3": 75.96400000000006, "coord_origin": "TOPLEFT"}, "text": "Computer Vision and Pattern Recognition", "orig": "Computer Vision and Pattern Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 223.579, "r_y0": 83.82299999999998, "r_x1": 225.821, "r_y1": 83.82299999999998, "r_x2": 225.821, "r_y2": 76.12599999999998, "r_x3": 223.579, "r_y3": 76.12599999999998, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 229.183, "r_y0": 83.82299999999998, "r_x1": 286.362, "r_y1": 83.82299999999998, "r_x2": 286.362, "r_y2": 76.12599999999998, "r_x3": 229.183, "r_y3": 76.12599999999998, "coord_origin": "TOPLEFT"}, "text": "pages 658-666,", "orig": "pages 658-666,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 94.78200000000004, "r_x1": 97.917, "r_y1": 94.78200000000004, "r_x2": 97.917, "r_y2": 87.08500000000004, "r_x3": 70.031, "r_y3": 87.08500000000004, "coord_origin": "TOPLEFT"}, "text": "2019. 6", "orig": "2019. 6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 106.10500000000002, "r_x1": 65.05, "r_y1": 106.10500000000002, "r_x2": 65.05, "r_y2": 98.40800000000002, "r_x3": 50.112, "r_y3": 98.40800000000002, "coord_origin": "TOPLEFT"}, "text": "[26]", "orig": "[26]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 106.10500000000002, "r_x1": 286.359, "r_y1": 106.10500000000002, "r_x2": 286.359, "r_y2": 98.40800000000002, "r_x3": 70.035, "r_y3": 98.40800000000002, "coord_origin": "TOPLEFT"}, "text": "Sebastian Schreiber, Stefan Agne, Ivo Wolf, Andreas Den-", "orig": "Sebastian Schreiber, Stefan Agne, Ivo Wolf, Andreas Den-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 117.06399999999996, "r_x1": 286.363, "r_y1": 117.06399999999996, "r_x2": 286.363, "r_y2": 109.36699999999996, "r_x3": 70.031, "r_y3": 109.36699999999996, "coord_origin": "TOPLEFT"}, "text": "gel, and Sheraz Ahmed. Deepdesrt: Deep learning for detec-", "orig": "gel, and Sheraz Ahmed. Deepdesrt: Deep learning for detec-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 128.02300000000002, "r_x1": 286.363, "r_y1": 128.02300000000002, "r_x2": 286.363, "r_y2": 120.32600000000002, "r_x3": 70.031, "r_y3": 120.32600000000002, "coord_origin": "TOPLEFT"}, "text": "tion and structure recognition of tables in document images.", "orig": "tion and structure recognition of tables in document images.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 138.98199999999997, "r_x1": 77.5, "r_y1": 138.98199999999997, "r_x2": 77.5, "r_y2": 131.28499999999997, "r_x3": 70.031, "r_y3": 131.28499999999997, "coord_origin": "TOPLEFT"}, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 80.56, "r_y0": 138.85299999999995, "r_x1": 286.366, "r_y1": 138.85299999999995, "r_x2": 286.366, "r_y2": 131.12300000000005, "r_x3": 80.56, "r_y3": 131.12300000000005, "coord_origin": "TOPLEFT"}, "text": "2017 14th IAPR International Conference on Document", "orig": "2017 14th IAPR International Conference on Document", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 149.812, "r_x1": 195.229, "r_y1": 149.812, "r_x2": 195.229, "r_y2": 142.082, "r_x3": 70.031, "r_y3": 142.082, "coord_origin": "TOPLEFT"}, "text": "Analysis and Recognition (ICDAR)", "orig": "Analysis and Recognition (ICDAR)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 195.231, "r_y0": 149.94100000000003, "r_x1": 286.365, "r_y1": 149.94100000000003, "r_x2": 286.365, "r_y2": 142.24400000000003, "r_x3": 195.231, "r_y3": 142.24400000000003, "coord_origin": "TOPLEFT"}, "text": ", volume 01, pages 1162-", "orig": ", volume 01, pages 1162-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 160.89999999999998, "r_x1": 120.333, "r_y1": 160.89999999999998, "r_x2": 120.333, "r_y2": 153.20299999999997, "r_x3": 70.031, "r_y3": 153.20299999999997, "coord_origin": "TOPLEFT"}, "text": "1167, 2017. 1", "orig": "1167, 2017. 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 172.22400000000005, "r_x1": 65.05, "r_y1": 172.22400000000005, "r_x2": 65.05, "r_y2": 164.52700000000004, "r_x3": 50.112, "r_y3": 164.52700000000004, "coord_origin": "TOPLEFT"}, "text": "[27]", "orig": "[27]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 172.22400000000005, "r_x1": 286.359, "r_y1": 172.22400000000005, "r_x2": 286.359, "r_y2": 164.52700000000004, "r_x3": 70.035, "r_y3": 164.52700000000004, "coord_origin": "TOPLEFT"}, "text": "Sebastian Schreiber, Stefan Agne, Ivo Wolf, Andreas Den-", "orig": "Sebastian Schreiber, Stefan Agne, Ivo Wolf, Andreas Den-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 183.183, "r_x1": 158.395, "r_y1": 183.183, "r_x2": 158.395, "r_y2": 175.486, "r_x3": 70.031, "r_y3": 175.486, "coord_origin": "TOPLEFT"}, "text": "gel, and Sheraz Ahmed.", "orig": "gel, and Sheraz Ahmed.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 164.035, "r_y0": 183.183, "r_x1": 202.877, "r_y1": 183.183, "r_x2": 202.877, "r_y2": 175.486, "r_x3": 164.035, "r_y3": 175.486, "coord_origin": "TOPLEFT"}, "text": "Deepdesrt:", "orig": "Deepdesrt:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 207.163, "r_y0": 183.183, "r_x1": 286.363, "r_y1": 183.183, "r_x2": 286.363, "r_y2": 175.486, "r_x3": 207.163, "r_y3": 175.486, "coord_origin": "TOPLEFT"}, "text": "Deep learning for de-", "orig": "Deep learning for de-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 194.14200000000005, "r_x1": 286.363, "r_y1": 194.14200000000005, "r_x2": 286.363, "r_y2": 186.44500000000005, "r_x3": 70.031, "r_y3": 186.44500000000005, "coord_origin": "TOPLEFT"}, "text": "tection and structure recognition of tables in document im-", "orig": "tection and structure recognition of tables in document im-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 19, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 205.101, "r_x1": 88.206, "r_y1": 205.101, "r_x2": 88.206, "r_y2": 197.404, "r_x3": 70.031, "r_y3": 197.404, "coord_origin": "TOPLEFT"}, "text": "ages.", "orig": "ages.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 20, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 93.864, "r_y0": 205.101, "r_x1": 101.333, "r_y1": 205.101, "r_x2": 101.333, "r_y2": 197.404, "r_x3": 93.864, "r_y3": 197.404, "coord_origin": "TOPLEFT"}, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 21, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 104.331, "r_y0": 204.97199999999998, "r_x1": 286.358, "r_y1": 204.97199999999998, "r_x2": 286.358, "r_y2": 197.24199999999996, "r_x3": 104.331, "r_y3": 197.24199999999996, "coord_origin": "TOPLEFT"}, "text": "2017 14th IAPR international conference on doc-", "orig": "2017 14th IAPR international conference on doc-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 22, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 215.92999999999995, "r_x1": 220.487, "r_y1": 215.92999999999995, "r_x2": 220.487, "r_y2": 208.20000000000005, "r_x3": 70.031, "r_y3": 208.20000000000005, "coord_origin": "TOPLEFT"}, "text": "ument analysis and recognition (ICDAR)", "orig": "ument analysis and recognition (ICDAR)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 23, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 220.484, "r_y0": 216.05899999999997, "r_x1": 222.726, "r_y1": 216.05899999999997, "r_x2": 222.726, "r_y2": 208.36199999999997, "r_x3": 220.484, "r_y3": 208.36199999999997, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 24, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 225.909, "r_y0": 216.05899999999997, "r_x1": 286.36, "r_y1": 216.05899999999997, "r_x2": 286.36, "r_y2": 208.36199999999997, "r_x3": 225.909, "r_y3": 208.36199999999997, "coord_origin": "TOPLEFT"}, "text": "volume 1, pages", "orig": "volume 1, pages", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 25, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 227.01800000000003, "r_x1": 166.653, "r_y1": 227.01800000000003, "r_x2": 166.653, "r_y2": 219.32100000000003, "r_x3": 70.031, "r_y3": 219.32100000000003, "coord_origin": "TOPLEFT"}, "text": "1162-1167. IEEE, 2017. 3", "orig": "1162-1167. IEEE, 2017. 3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 26, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 238.34199999999998, "r_x1": 65.05, "r_y1": 238.34199999999998, "r_x2": 65.05, "r_y2": 230.64499999999998, "r_x3": 50.112, "r_y3": 230.64499999999998, "coord_origin": "TOPLEFT"}, "text": "[28]", "orig": "[28]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 27, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 238.34199999999998, "r_x1": 179.147, "r_y1": 238.34199999999998, "r_x2": 179.147, "r_y2": 230.64499999999998, "r_x3": 70.035, "r_y3": 230.64499999999998, "coord_origin": "TOPLEFT"}, "text": "Faisal Shafait and Ray Smith.", "orig": "Faisal Shafait and Ray Smith.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 28, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 184.366, "r_y0": 238.34199999999998, "r_x1": 286.359, "r_y1": 238.34199999999998, "r_x2": 286.359, "r_y2": 230.64499999999998, "r_x3": 184.366, "r_y3": 230.64499999999998, "coord_origin": "TOPLEFT"}, "text": "Table detection in heteroge-", "orig": "Table detection in heteroge-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 29, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 249.30100000000004, "r_x1": 134.804, "r_y1": 249.30100000000004, "r_x2": 134.804, "r_y2": 241.60400000000004, "r_x3": 70.031, "r_y3": 241.60400000000004, "coord_origin": "TOPLEFT"}, "text": "neous documents.", "orig": "neous documents.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 30, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 139.7, "r_y0": 249.30100000000004, "r_x1": 147.169, "r_y1": 249.30100000000004, "r_x2": 147.169, "r_y2": 241.60400000000004, "r_x3": 139.7, "r_y3": 241.60400000000004, "coord_origin": "TOPLEFT"}, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 149.933, "r_y0": 249.17200000000003, "r_x1": 286.366, "r_y1": 249.17200000000003, "r_x2": 286.366, "r_y2": 241.442, "r_x3": 149.933, "r_y3": 241.442, "coord_origin": "TOPLEFT"}, "text": "Proceedings of the 9th IAPR Interna-", "orig": "Proceedings of the 9th IAPR Interna-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 260.131, "r_x1": 244.688, "r_y1": 260.131, "r_x2": 244.688, "r_y2": 252.40099999999995, "r_x3": 70.031, "r_y3": 252.40099999999995, "coord_origin": "TOPLEFT"}, "text": "tional Workshop on Document Analysis Systems", "orig": "tional Workshop on Document Analysis Systems", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 244.691, "r_y0": 260.26, "r_x1": 246.933, "r_y1": 260.26, "r_x2": 246.933, "r_y2": 252.563, "r_x3": 244.691, "r_y3": 252.563, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 249.775, "r_y0": 260.26, "r_x1": 286.358, "r_y1": 260.26, "r_x2": 286.358, "r_y2": 252.563, "r_x3": 249.775, "r_y3": 252.563, "coord_origin": "TOPLEFT"}, "text": "pages 65-", "orig": "pages 65-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 271.21900000000005, "r_x1": 111.366, "r_y1": 271.21900000000005, "r_x2": 111.366, "r_y2": 263.52200000000005, "r_x3": 70.031, "r_y3": 263.52200000000005, "coord_origin": "TOPLEFT"}, "text": "72, 2010. 2", "orig": "72, 2010. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 282.543, "r_x1": 65.05, "r_y1": 282.543, "r_x2": 65.05, "r_y2": 274.846, "r_x3": 50.112, "r_y3": 274.846, "coord_origin": "TOPLEFT"}, "text": "[29]", "orig": "[29]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 282.543, "r_x1": 94.944, "r_y1": 282.543, "r_x2": 94.944, "r_y2": 274.846, "r_x3": 70.035, "r_y3": 274.846, "coord_origin": "TOPLEFT"}, "text": "Shoaib", "orig": "Shoaib", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 100.871, "r_y0": 282.543, "r_x1": 127.268, "r_y1": 282.543, "r_x2": 127.268, "r_y2": 274.846, "r_x3": 100.871, "r_y3": 274.846, "coord_origin": "TOPLEFT"}, "text": "Ahmed", "orig": "Ahmed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 133.195, "r_y0": 282.543, "r_x1": 165.832, "r_y1": 282.543, "r_x2": 165.832, "r_y2": 274.846, "r_x3": 133.195, "r_y3": 274.846, "coord_origin": "TOPLEFT"}, "text": "Siddiqui,", "orig": "Siddiqui,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 172.683, "r_y0": 282.543, "r_x1": 194.094, "r_y1": 282.543, "r_x2": 194.094, "r_y2": 274.846, "r_x3": 172.683, "r_y3": 274.846, "coord_origin": "TOPLEFT"}, "text": "Imran", "orig": "Imran", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 200.021, "r_y0": 282.543, "r_x1": 211.48, "r_y1": 282.543, "r_x2": 211.48, "r_y2": 274.846, "r_x3": 200.021, "r_y3": 274.846, "coord_origin": "TOPLEFT"}, "text": "Ali", "orig": "Ali", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 217.407, "r_y0": 282.543, "r_x1": 239.438, "r_y1": 282.543, "r_x2": 239.438, "r_y2": 274.846, "r_x3": 217.407, "r_y3": 274.846, "coord_origin": "TOPLEFT"}, "text": "Fateh,", "orig": "Fateh,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 246.288, "r_y0": 282.543, "r_x1": 264.221, "r_y1": 282.543, "r_x2": 264.221, "r_y2": 274.846, "r_x3": 246.288, "r_y3": 274.846, "coord_origin": "TOPLEFT"}, "text": "Syed", "orig": "Syed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 270.147, "r_y0": 282.543, "r_x1": 286.359, "r_y1": 282.543, "r_x2": 286.359, "r_y2": 274.846, "r_x3": 270.147, "r_y3": 274.846, "coord_origin": "TOPLEFT"}, "text": "Tah-", "orig": "Tah-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 293.502, "r_x1": 85.964, "r_y1": 293.502, "r_x2": 85.964, "r_y2": 285.805, "r_x3": 70.031, "r_y3": 285.805, "coord_origin": "TOPLEFT"}, "text": "seen", "orig": "seen", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 91.021, "r_y0": 293.502, "r_x1": 108.945, "r_y1": 293.502, "r_x2": 108.945, "r_y2": 285.805, "r_x3": 91.021, "r_y3": 285.805, "coord_origin": "TOPLEFT"}, "text": "Raza", "orig": "Raza", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 114.002, "r_y0": 293.502, "r_x1": 135.674, "r_y1": 293.502, "r_x2": 135.674, "r_y2": 285.805, "r_x3": 114.002, "r_y3": 285.805, "coord_origin": "TOPLEFT"}, "text": "Rizvi,", "orig": "Rizvi,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 48, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 141.43, "r_y0": 293.502, "r_x1": 171.306, "r_y1": 293.502, "r_x2": 171.306, "r_y2": 285.805, "r_x3": 141.43, "r_y3": 285.805, "coord_origin": "TOPLEFT"}, "text": "Andreas", "orig": "Andreas", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 49, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 176.364, "r_y0": 293.502, "r_x1": 204.5, "r_y1": 293.502, "r_x2": 204.5, "r_y2": 285.805, "r_x3": 176.364, "r_y3": 285.805, "coord_origin": "TOPLEFT"}, "text": "Dengel,", "orig": "Dengel,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 50, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 210.265, "r_y0": 293.502, "r_x1": 223.213, "r_y1": 293.502, "r_x2": 223.213, "r_y2": 285.805, "r_x3": 210.265, "r_y3": 285.805, "coord_origin": "TOPLEFT"}, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 51, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 228.27, "r_y0": 293.502, "r_x1": 252.668, "r_y1": 293.502, "r_x2": 252.668, "r_y2": 285.805, "r_x3": 228.27, "r_y3": 285.805, "coord_origin": "TOPLEFT"}, "text": "Sheraz", "orig": "Sheraz", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 52, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 257.725, "r_y0": 293.502, "r_x1": 286.363, "r_y1": 293.502, "r_x2": 286.363, "r_y2": 285.805, "r_x3": 257.725, "r_y3": 285.805, "coord_origin": "TOPLEFT"}, "text": "Ahmed.", "orig": "Ahmed.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 53, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 304.461, "r_x1": 286.363, "r_y1": 304.461, "r_x2": 286.363, "r_y2": 296.764, "r_x3": 70.031, "r_y3": 296.764, "coord_origin": "TOPLEFT"}, "text": "Deeptabstr: Deep learning based table structure recognition.", "orig": "Deeptabstr: Deep learning based table structure recognition.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 54, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 315.42, "r_x1": 77.5, "r_y1": 315.42, "r_x2": 77.5, "r_y2": 307.723, "r_x3": 70.031, "r_y3": 307.723, "coord_origin": "TOPLEFT"}, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 55, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 79.35, "r_y0": 315.291, "r_x1": 286.366, "r_y1": 315.291, "r_x2": 286.366, "r_y2": 307.561, "r_x3": 79.35, "r_y3": 307.561, "coord_origin": "TOPLEFT"}, "text": "2019 International Conference on Document Analysis and", "orig": "2019 International Conference on Document Analysis and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 56, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 326.249, "r_x1": 147.572, "r_y1": 326.249, "r_x2": 147.572, "r_y2": 318.519, "r_x3": 70.031, "r_y3": 318.519, "coord_origin": "TOPLEFT"}, "text": "Recognition (ICDAR)", "orig": "Recognition (ICDAR)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 57, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 147.572, "r_y0": 326.378, "r_x1": 271.335, "r_y1": 326.378, "r_x2": 271.335, "r_y2": 318.681, "r_x3": 147.572, "r_y3": 318.681, "coord_origin": "TOPLEFT"}, "text": ", pages 1403-1409. IEEE, 2019. 3", "orig": ", pages 1403-1409. IEEE, 2019. 3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 58, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 337.702, "r_x1": 65.05, "r_y1": 337.702, "r_x2": 65.05, "r_y2": 330.005, "r_x3": 50.112, "r_y3": 330.005, "coord_origin": "TOPLEFT"}, "text": "[30]", "orig": "[30]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 59, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 337.702, "r_x1": 286.359, "r_y1": 337.702, "r_x2": 286.359, "r_y2": 330.005, "r_x3": 70.035, "r_y3": 330.005, "coord_origin": "TOPLEFT"}, "text": "Peter WJ Staar, Michele Dolfi, Christoph Auer, and Costas", "orig": "Peter WJ Staar, Michele Dolfi, Christoph Auer, and Costas", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 60, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 348.661, "r_x1": 286.363, "r_y1": 348.661, "r_x2": 286.363, "r_y2": 340.964, "r_x3": 70.031, "r_y3": 340.964, "coord_origin": "TOPLEFT"}, "text": "Bekas. Corpus conversion service: A machine learning plat-", "orig": "Bekas. Corpus conversion service: A machine learning plat-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 61, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 359.62, "r_x1": 198.824, "r_y1": 359.62, "r_x2": 198.824, "r_y2": 351.923, "r_x3": 70.031, "r_y3": 351.923, "coord_origin": "TOPLEFT"}, "text": "form to ingest documents at scale.", "orig": "form to ingest documents at scale.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 62, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 206.06, "r_y0": 359.62, "r_x1": 213.529, "r_y1": 359.62, "r_x2": 213.529, "r_y2": 351.923, "r_x3": 206.06, "r_y3": 351.923, "coord_origin": "TOPLEFT"}, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 63, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 217.021, "r_y0": 359.491, "r_x1": 286.358, "r_y1": 359.491, "r_x2": 286.358, "r_y2": 351.761, "r_x3": 217.021, "r_y3": 351.761, "coord_origin": "TOPLEFT"}, "text": "Proceedings of the", "orig": "Proceedings of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 64, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 370.45, "r_x1": 143.08, "r_y1": 370.45, "r_x2": 143.08, "r_y2": 362.72, "r_x3": 70.031, "r_y3": 362.72, "coord_origin": "TOPLEFT"}, "text": "24th ACM SIGKDD", "orig": "24th ACM SIGKDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 65, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 143.078, "r_y0": 370.579, "r_x1": 145.32, "r_y1": 370.579, "r_x2": 145.32, "r_y2": 362.882, "r_x3": 143.078, "r_y3": 362.882, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 66, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 148.108, "r_y0": 370.579, "r_x1": 286.361, "r_y1": 370.579, "r_x2": 286.361, "r_y2": 362.882, "r_x3": 148.108, "r_y3": 362.882, "coord_origin": "TOPLEFT"}, "text": "KDD '18, pages 774-782, New York,", "orig": "KDD '18, pages 774-782, New York,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 67, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 381.538, "r_x1": 161.157, "r_y1": 381.538, "r_x2": 161.157, "r_y2": 373.841, "r_x3": 70.031, "r_y3": 373.841, "coord_origin": "TOPLEFT"}, "text": "NY, USA, 2018. ACM. 1", "orig": "NY, USA, 2018. ACM. 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 68, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 392.862, "r_x1": 65.05, "r_y1": 392.862, "r_x2": 65.05, "r_y2": 385.165, "r_x3": 50.112, "r_y3": 385.165, "coord_origin": "TOPLEFT"}, "text": "[31]", "orig": "[31]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 69, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 392.862, "r_x1": 286.359, "r_y1": 392.862, "r_x2": 286.359, "r_y2": 385.165, "r_x3": 70.035, "r_y3": 385.165, "coord_origin": "TOPLEFT"}, "text": "Ashish Vaswani, Noam Shazeer, Niki Parmar, Jakob Uszko-", "orig": "Ashish Vaswani, Noam Shazeer, Niki Parmar, Jakob Uszko-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 70, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 403.821, "r_x1": 84.225, "r_y1": 403.821, "r_x2": 84.225, "r_y2": 396.124, "r_x3": 70.031, "r_y3": 396.124, "coord_origin": "TOPLEFT"}, "text": "reit,", "orig": "reit,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 71, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 87.489, "r_y0": 403.821, "r_x1": 286.363, "r_y1": 403.821, "r_x2": 286.363, "r_y2": 396.124, "r_x3": 87.489, "r_y3": 396.124, "coord_origin": "TOPLEFT"}, "text": "Llion Jones, Aidan N Gomez, \u0141 ukasz Kaiser, and Il-", "orig": "Llion Jones, Aidan N Gomez, \u0141 ukasz Kaiser, and Il-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 72, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 414.78, "r_x1": 78.997, "r_y1": 414.78, "r_x2": 78.997, "r_y2": 407.083, "r_x3": 70.031, "r_y3": 407.083, "coord_origin": "TOPLEFT"}, "text": "lia", "orig": "lia", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 73, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 82.871, "r_y0": 414.78, "r_x1": 125.47, "r_y1": 414.78, "r_x2": 125.47, "r_y2": 407.083, "r_x3": 82.871, "r_y3": 407.083, "coord_origin": "TOPLEFT"}, "text": "Polosukhin.", "orig": "Polosukhin.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 74, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 133.908, "r_y0": 414.78, "r_x1": 167.783, "r_y1": 414.78, "r_x2": 167.783, "r_y2": 407.083, "r_x3": 133.908, "r_y3": 407.083, "coord_origin": "TOPLEFT"}, "text": "Attention", "orig": "Attention", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 75, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 171.656, "r_y0": 414.78, "r_x1": 177.637, "r_y1": 414.78, "r_x2": 177.637, "r_y2": 407.083, "r_x3": 171.656, "r_y3": 407.083, "coord_origin": "TOPLEFT"}, "text": "is", "orig": "is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 76, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 181.51, "r_y0": 414.78, "r_x1": 190.477, "r_y1": 414.78, "r_x2": 190.477, "r_y2": 407.083, "r_x3": 181.51, "r_y3": 407.083, "coord_origin": "TOPLEFT"}, "text": "all", "orig": "all", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 77, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 194.341, "r_y0": 414.78, "r_x1": 230.834, "r_y1": 414.78, "r_x2": 230.834, "r_y2": 407.083, "r_x3": 194.341, "r_y3": 407.083, "coord_origin": "TOPLEFT"}, "text": "you need.", "orig": "you need.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 78, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 239.272, "r_y0": 414.78, "r_x1": 246.741, "r_y1": 414.78, "r_x2": 246.741, "r_y2": 407.083, "r_x3": 239.272, "r_y3": 407.083, "coord_origin": "TOPLEFT"}, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 79, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 250.614, "r_y0": 414.78, "r_x1": 255.842, "r_y1": 414.78, "r_x2": 255.842, "r_y2": 407.083, "r_x3": 250.614, "r_y3": 407.083, "coord_origin": "TOPLEFT"}, "text": "I.", "orig": "I.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 80, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 259.715, "r_y0": 414.78, "r_x1": 286.363, "r_y1": 414.78, "r_x2": 286.363, "r_y2": 407.083, "r_x3": 259.715, "r_y3": 407.083, "coord_origin": "TOPLEFT"}, "text": "Guyon,", "orig": "Guyon,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 81, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 425.739, "r_x1": 286.363, "r_y1": 425.739, "r_x2": 286.363, "r_y2": 418.042, "r_x3": 70.031, "r_y3": 418.042, "coord_origin": "TOPLEFT"}, "text": "U. V. Luxburg, S. Bengio, H. Wallach, R. Fergus, S. Vish-", "orig": "U. V. Luxburg, S. Bengio, H. Wallach, R. Fergus, S. Vish-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 82, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 436.697, "r_x1": 196.762, "r_y1": 436.697, "r_x2": 196.762, "r_y2": 429.0, "r_x3": 70.031, "r_y3": 429.0, "coord_origin": "TOPLEFT"}, "text": "wanathan, and R. Garnett, editors,", "orig": "wanathan, and R. Garnett, editors,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 83, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 200.202, "r_y0": 436.568, "r_x1": 286.36, "r_y1": 436.568, "r_x2": 286.36, "r_y2": 428.838, "r_x3": 200.202, "r_y3": 428.838, "coord_origin": "TOPLEFT"}, "text": "Advances in Neural In-", "orig": "Advances in Neural In-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 84, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 447.527, "r_x1": 189.194, "r_y1": 447.527, "r_x2": 189.194, "r_y2": 439.797, "r_x3": 70.031, "r_y3": 439.797, "coord_origin": "TOPLEFT"}, "text": "formation Processing Systems 30", "orig": "formation Processing Systems 30", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 85, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 189.195, "r_y0": 447.656, "r_x1": 191.437, "r_y1": 447.656, "r_x2": 191.437, "r_y2": 439.959, "r_x3": 189.195, "r_y3": 439.959, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 86, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 193.795, "r_y0": 447.656, "r_x1": 286.364, "r_y1": 447.656, "r_x2": 286.364, "r_y2": 439.959, "r_x3": 193.795, "r_y3": 439.959, "coord_origin": "TOPLEFT"}, "text": "pages 5998-6008. Curran", "orig": "pages 5998-6008. Curran", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 87, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 458.615, "r_x1": 158.924, "r_y1": 458.615, "r_x2": 158.924, "r_y2": 450.918, "r_x3": 70.031, "r_y3": 450.918, "coord_origin": "TOPLEFT"}, "text": "Associates, Inc., 2017. 5", "orig": "Associates, Inc., 2017. 5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 88, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 469.939, "r_x1": 65.05, "r_y1": 469.939, "r_x2": 65.05, "r_y2": 462.242, "r_x3": 50.112, "r_y3": 462.242, "coord_origin": "TOPLEFT"}, "text": "[32]", "orig": "[32]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 89, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 469.939, "r_x1": 88.963, "r_y1": 469.939, "r_x2": 88.963, "r_y2": 462.242, "r_x3": 70.035, "r_y3": 462.242, "coord_origin": "TOPLEFT"}, "text": "Oriol", "orig": "Oriol", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 90, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 92.81, "r_y0": 469.939, "r_x1": 122.274, "r_y1": 469.939, "r_x2": 122.274, "r_y2": 462.242, "r_x3": 92.81, "r_y3": 462.242, "coord_origin": "TOPLEFT"}, "text": "Vinyals,", "orig": "Vinyals,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 91, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 126.524, "r_y0": 469.939, "r_x1": 194.695, "r_y1": 469.939, "r_x2": 194.695, "r_y2": 462.242, "r_x3": 126.524, "r_y3": 462.242, "coord_origin": "TOPLEFT"}, "text": "Alexander Toshev,", "orig": "Alexander Toshev,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 92, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 198.954, "r_y0": 469.939, "r_x1": 286.359, "r_y1": 469.939, "r_x2": 286.359, "r_y2": 462.242, "r_x3": 198.954, "r_y3": 462.242, "coord_origin": "TOPLEFT"}, "text": "Samy Bengio, and Du-", "orig": "Samy Bengio, and Du-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 93, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 480.898, "r_x1": 116.28, "r_y1": 480.898, "r_x2": 116.28, "r_y2": 473.201, "r_x3": 70.031, "r_y3": 473.201, "coord_origin": "TOPLEFT"}, "text": "mitru Erhan.", "orig": "mitru Erhan.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 94, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 122.484, "r_y0": 480.898, "r_x1": 175.924, "r_y1": 480.898, "r_x2": 175.924, "r_y2": 473.201, "r_x3": 122.484, "r_y3": 473.201, "coord_origin": "TOPLEFT"}, "text": "Show and tell:", "orig": "Show and tell:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 95, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 180.56, "r_y0": 480.898, "r_x1": 286.363, "r_y1": 480.898, "r_x2": 286.363, "r_y2": 473.201, "r_x3": 180.56, "r_y3": 473.201, "coord_origin": "TOPLEFT"}, "text": "A neural image caption gen-", "orig": "A neural image caption gen-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 96, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 491.857, "r_x1": 103.305, "r_y1": 491.857, "r_x2": 103.305, "r_y2": 484.16, "r_x3": 70.031, "r_y3": 484.16, "coord_origin": "TOPLEFT"}, "text": "erator. In", "orig": "erator. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 97, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 105.516, "r_y0": 491.728, "r_x1": 286.359, "r_y1": 491.728, "r_x2": 286.359, "r_y2": 483.998, "r_x3": 105.516, "r_y3": 483.998, "coord_origin": "TOPLEFT"}, "text": "Proceedings of the IEEE Conference on Computer", "orig": "Proceedings of the IEEE Conference on Computer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 98, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 502.687, "r_x1": 212.516, "r_y1": 502.687, "r_x2": 212.516, "r_y2": 494.957, "r_x3": 70.031, "r_y3": 494.957, "coord_origin": "TOPLEFT"}, "text": "Vision and Pattern Recognition (CVPR)", "orig": "Vision and Pattern Recognition (CVPR)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 99, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 212.514, "r_y0": 502.816, "r_x1": 263.56, "r_y1": 502.816, "r_x2": 263.56, "r_y2": 495.119, "r_x3": 212.514, "r_y3": 495.119, "coord_origin": "TOPLEFT"}, "text": ", June 2015. 2", "orig": ", June 2015. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 100, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 514.14, "r_x1": 65.05, "r_y1": 514.14, "r_x2": 65.05, "r_y2": 506.443, "r_x3": 50.112, "r_y3": 506.443, "coord_origin": "TOPLEFT"}, "text": "[33]", "orig": "[33]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 101, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 514.14, "r_x1": 247.373, "r_y1": 514.14, "r_x2": 247.373, "r_y2": 506.443, "r_x3": 70.035, "r_y3": 506.443, "coord_origin": "TOPLEFT"}, "text": "Wenyuan Xue, Qingyong Li, and Dacheng Tao.", "orig": "Wenyuan Xue, Qingyong Li, and Dacheng Tao.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 102, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 253.972, "r_y0": 514.14, "r_x1": 286.359, "r_y1": 514.14, "r_x2": 286.359, "r_y2": 506.443, "r_x3": 253.972, "r_y3": 506.443, "coord_origin": "TOPLEFT"}, "text": "Res2tim:", "orig": "Res2tim:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 103, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 525.0989999999999, "r_x1": 253.125, "r_y1": 525.0989999999999, "r_x2": 253.125, "r_y2": 517.402, "r_x3": 70.031, "r_y3": 517.402, "coord_origin": "TOPLEFT"}, "text": "reconstruct syntactic structures from table images.", "orig": "reconstruct syntactic structures from table images.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 104, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 258.155, "r_y0": 525.0989999999999, "r_x1": 265.624, "r_y1": 525.0989999999999, "r_x2": 265.624, "r_y2": 517.402, "r_x3": 258.155, "r_y3": 517.402, "coord_origin": "TOPLEFT"}, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 105, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 268.429, "r_y0": 524.97, "r_x1": 286.362, "r_y1": 524.97, "r_x2": 286.362, "r_y2": 517.24, "r_x3": 268.429, "r_y3": 517.24, "coord_origin": "TOPLEFT"}, "text": "2019", "orig": "2019", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 106, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 535.929, "r_x1": 286.363, "r_y1": 535.929, "r_x2": 286.363, "r_y2": 528.1990000000001, "r_x3": 70.031, "r_y3": 528.1990000000001, "coord_origin": "TOPLEFT"}, "text": "International Conference on Document Analysis and Recog-", "orig": "International Conference on Document Analysis and Recog-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 107, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 546.887, "r_x1": 125.255, "r_y1": 546.887, "r_x2": 125.255, "r_y2": 539.157, "r_x3": 70.031, "r_y3": 539.157, "coord_origin": "TOPLEFT"}, "text": "nition (ICDAR)", "orig": "nition (ICDAR)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 108, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 125.254, "r_y0": 547.016, "r_x1": 240.051, "r_y1": 547.016, "r_x2": 240.051, "r_y2": 539.319, "r_x3": 125.254, "r_y3": 539.319, "coord_origin": "TOPLEFT"}, "text": ", pages 749-755. IEEE, 2019. 3", "orig": ", pages 749-755. IEEE, 2019. 3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 109, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 558.34, "r_x1": 65.05, "r_y1": 558.34, "r_x2": 65.05, "r_y2": 550.643, "r_x3": 50.112, "r_y3": 550.643, "coord_origin": "TOPLEFT"}, "text": "[34]", "orig": "[34]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 110, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 558.34, "r_x1": 125.008, "r_y1": 558.34, "r_x2": 125.008, "r_y2": 550.643, "r_x3": 70.035, "r_y3": 550.643, "coord_origin": "TOPLEFT"}, "text": "Wenyuan Xue,", "orig": "Wenyuan Xue,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 111, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 129.823, "r_y0": 558.34, "r_x1": 181.676, "r_y1": 558.34, "r_x2": 181.676, "r_y2": 550.643, "r_x3": 129.823, "r_y3": 550.643, "coord_origin": "TOPLEFT"}, "text": "Baosheng Yu,", "orig": "Baosheng Yu,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 112, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 186.491, "r_y0": 558.34, "r_x1": 286.359, "r_y1": 558.34, "r_x2": 286.359, "r_y2": 550.643, "r_x3": 186.491, "r_y3": 550.643, "coord_origin": "TOPLEFT"}, "text": "Wen Wang, Dacheng Tao,", "orig": "Wen Wang, Dacheng Tao,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 113, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 569.299, "r_x1": 137.082, "r_y1": 569.299, "r_x2": 137.082, "r_y2": 561.602, "r_x3": 70.031, "r_y3": 561.602, "coord_origin": "TOPLEFT"}, "text": "and Qingyong Li.", "orig": "and Qingyong Li.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 114, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 145.985, "r_y0": 569.299, "r_x1": 172.382, "r_y1": 569.299, "r_x2": 172.382, "r_y2": 561.602, "r_x3": 145.985, "r_y3": 561.602, "coord_origin": "TOPLEFT"}, "text": "Tgrnet:", "orig": "Tgrnet:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 115, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 178.704, "r_y0": 569.299, "r_x1": 206.625, "r_y1": 569.299, "r_x2": 206.625, "r_y2": 561.602, "r_x3": 178.704, "r_y3": 561.602, "coord_origin": "TOPLEFT"}, "text": "A table", "orig": "A table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 116, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 210.633, "r_y0": 569.299, "r_x1": 286.363, "r_y1": 569.299, "r_x2": 286.363, "r_y2": 561.602, "r_x3": 210.633, "r_y3": 561.602, "coord_origin": "TOPLEFT"}, "text": "graph reconstruction", "orig": "graph reconstruction", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 117, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 580.258, "r_x1": 99.324, "r_y1": 580.258, "r_x2": 99.324, "r_y2": 572.561, "r_x3": 70.031, "r_y3": 572.561, "coord_origin": "TOPLEFT"}, "text": "network", "orig": "network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 118, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 104.157, "r_y0": 580.258, "r_x1": 114.612, "r_y1": 580.258, "r_x2": 114.612, "r_y2": 572.561, "r_x3": 104.157, "r_y3": 572.561, "coord_origin": "TOPLEFT"}, "text": "for", "orig": "for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 119, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 119.454, "r_y0": 580.258, "r_x1": 136.884, "r_y1": 580.258, "r_x2": 136.884, "r_y2": 572.561, "r_x3": 119.454, "r_y3": 572.561, "coord_origin": "TOPLEFT"}, "text": "table", "orig": "table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 120, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 141.717, "r_y0": 580.258, "r_x1": 173.091, "r_y1": 580.258, "r_x2": 173.091, "r_y2": 572.561, "r_x3": 141.717, "r_y3": 572.561, "coord_origin": "TOPLEFT"}, "text": "structure", "orig": "structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 121, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 177.933, "r_y0": 580.258, "r_x1": 221.007, "r_y1": 580.258, "r_x2": 221.007, "r_y2": 572.561, "r_x3": 177.933, "r_y3": 572.561, "coord_origin": "TOPLEFT"}, "text": "recognition.", "orig": "recognition.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 122, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 232.543, "r_y0": 580.129, "r_x1": 252.466, "r_y1": 580.129, "r_x2": 252.466, "r_y2": 572.399, "r_x3": 232.543, "r_y3": 572.399, "coord_origin": "TOPLEFT"}, "text": "arXiv", "orig": "arXiv", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 123, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 257.299, "r_y0": 580.129, "r_x1": 286.359, "r_y1": 580.129, "r_x2": 286.359, "r_y2": 572.399, "r_x3": 257.299, "r_y3": 572.399, "coord_origin": "TOPLEFT"}, "text": "preprint", "orig": "preprint", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 124, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 591.088, "r_x1": 135.531, "r_y1": 591.088, "r_x2": 135.531, "r_y2": 583.358, "r_x3": 70.031, "r_y3": 583.358, "coord_origin": "TOPLEFT"}, "text": "arXiv:2106.10598", "orig": "arXiv:2106.10598", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 125, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 135.53, "r_y0": 591.217, "r_x1": 167.899, "r_y1": 591.217, "r_x2": 167.899, "r_y2": 583.52, "r_x3": 135.53, "r_y3": 583.52, "coord_origin": "TOPLEFT"}, "text": ", 2021. 3", "orig": ", 2021. 3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 126, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 602.5409999999999, "r_x1": 65.05, "r_y1": 602.5409999999999, "r_x2": 65.05, "r_y2": 594.844, "r_x3": 50.112, "r_y3": 594.844, "coord_origin": "TOPLEFT"}, "text": "[35]", "orig": "[35]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 127, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 602.5409999999999, "r_x1": 286.359, "r_y1": 602.5409999999999, "r_x2": 286.359, "r_y2": 594.844, "r_x3": 70.035, "r_y3": 594.844, "coord_origin": "TOPLEFT"}, "text": "Quanzeng You, Hailin Jin, Zhaowen Wang, Chen Fang, and", "orig": "Quanzeng You, Hailin Jin, Zhaowen Wang, Chen Fang, and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 128, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 613.5, "r_x1": 109.107, "r_y1": 613.5, "r_x2": 109.107, "r_y2": 605.803, "r_x3": 70.031, "r_y3": 605.803, "coord_origin": "TOPLEFT"}, "text": "Jiebo Luo.", "orig": "Jiebo Luo.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 129, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 116.226, "r_y0": 613.5, "r_x1": 271.766, "r_y1": 613.5, "r_x2": 271.766, "r_y2": 605.803, "r_x3": 116.226, "r_y3": 605.803, "coord_origin": "TOPLEFT"}, "text": "Image captioning with semantic attention.", "orig": "Image captioning with semantic attention.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 130, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 278.894, "r_y0": 613.5, "r_x1": 286.363, "r_y1": 613.5, "r_x2": 286.363, "r_y2": 605.803, "r_x3": 278.894, "r_y3": 605.803, "coord_origin": "TOPLEFT"}, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 131, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 624.33, "r_x1": 286.363, "r_y1": 624.33, "r_x2": 286.363, "r_y2": 616.6, "r_x3": 70.031, "r_y3": 616.6, "coord_origin": "TOPLEFT"}, "text": "Proceedings of the IEEE conference on computer vision and", "orig": "Proceedings of the IEEE conference on computer vision and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 132, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 635.289, "r_x1": 139.099, "r_y1": 635.289, "r_x2": 139.099, "r_y2": 627.559, "r_x3": 70.031, "r_y3": 627.559, "coord_origin": "TOPLEFT"}, "text": "pattern recognition", "orig": "pattern recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 133, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 139.098, "r_y0": 635.418, "r_x1": 238.957, "r_y1": 635.418, "r_x2": 238.957, "r_y2": 627.721, "r_x3": 139.098, "r_y3": 627.721, "coord_origin": "TOPLEFT"}, "text": ", pages 4651-4659, 2016. 4", "orig": ", pages 4651-4659, 2016. 4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 134, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 646.742, "r_x1": 65.05, "r_y1": 646.742, "r_x2": 65.05, "r_y2": 639.045, "r_x3": 50.112, "r_y3": 639.045, "coord_origin": "TOPLEFT"}, "text": "[36]", "orig": "[36]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 135, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 646.742, "r_x1": 286.359, "r_y1": 646.742, "r_x2": 286.359, "r_y2": 639.045, "r_x3": 70.035, "r_y3": 639.045, "coord_origin": "TOPLEFT"}, "text": "Xinyi Zheng, Doug Burdick, Lucian Popa, Peter Zhong, and", "orig": "Xinyi Zheng, Doug Burdick, Lucian Popa, Peter Zhong, and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 136, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 657.7, "r_x1": 286.363, "r_y1": 657.7, "r_x2": 286.363, "r_y2": 650.0029999999999, "r_x3": 70.031, "r_y3": 650.0029999999999, "coord_origin": "TOPLEFT"}, "text": "Nancy Xin Ru Wang. Global table extractor (gte): A frame-", "orig": "Nancy Xin Ru Wang. Global table extractor (gte): A frame-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 137, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 668.659, "r_x1": 286.363, "r_y1": 668.659, "r_x2": 286.363, "r_y2": 660.962, "r_x3": 70.031, "r_y3": 660.962, "coord_origin": "TOPLEFT"}, "text": "work for joint table identification and cell structure recogni-", "orig": "work for joint table identification and cell structure recogni-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 138, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 679.6179999999999, "r_x1": 158.458, "r_y1": 679.6179999999999, "r_x2": 158.458, "r_y2": 671.921, "r_x3": 70.031, "r_y3": 671.921, "coord_origin": "TOPLEFT"}, "text": "tion using visual context.", "orig": "tion using visual context.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 139, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.528, "r_y0": 679.489, "r_x1": 286.362, "r_y1": 679.489, "r_x2": 286.362, "r_y2": 671.759, "r_x3": 160.528, "r_y3": 671.759, "coord_origin": "TOPLEFT"}, "text": "Winter Conference for Applications", "orig": "Winter Conference for Applications", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 140, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 690.448, "r_x1": 171.423, "r_y1": 690.448, "r_x2": 171.423, "r_y2": 682.718, "r_x3": 70.031, "r_y3": 682.718, "coord_origin": "TOPLEFT"}, "text": "in Computer Vision (WACV)", "orig": "in Computer Vision (WACV)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 141, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 171.422, "r_y0": 690.577, "r_x1": 212.757, "r_y1": 690.577, "r_x2": 212.757, "r_y2": 682.88, "r_x3": 171.422, "r_y3": 682.88, "coord_origin": "TOPLEFT"}, "text": ", 2021. 2, 3", "orig": ", 2021. 2, 3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 142, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 701.901, "r_x1": 65.05, "r_y1": 701.901, "r_x2": 65.05, "r_y2": 694.204, "r_x3": 50.112, "r_y3": 694.204, "coord_origin": "TOPLEFT"}, "text": "[37]", "orig": "[37]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 143, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 701.901, "r_x1": 80.992, "r_y1": 701.901, "r_x2": 80.992, "r_y2": 694.204, "r_x3": 70.035, "r_y3": 694.204, "coord_origin": "TOPLEFT"}, "text": "Xu", "orig": "Xu", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 144, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 89.062, "r_y0": 701.901, "r_x1": 114.715, "r_y1": 701.901, "r_x2": 114.715, "r_y2": 694.204, "r_x3": 89.062, "r_y3": 694.204, "coord_origin": "TOPLEFT"}, "text": "Zhong,", "orig": "Zhong,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 145, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 124.246, "r_y0": 701.901, "r_x1": 149.146, "r_y1": 701.901, "r_x2": 149.146, "r_y2": 694.204, "r_x3": 124.246, "r_y3": 694.204, "coord_origin": "TOPLEFT"}, "text": "Elaheh", "orig": "Elaheh", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 146, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 157.225, "r_y0": 701.901, "r_x1": 209.373, "r_y1": 701.901, "r_x2": 209.373, "r_y2": 694.204, "r_x3": 157.225, "r_y3": 694.204, "coord_origin": "TOPLEFT"}, "text": "ShafieiBavani,", "orig": "ShafieiBavani,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 147, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 218.904, "r_y0": 701.901, "r_x1": 231.852, "r_y1": 701.901, "r_x2": 231.852, "r_y2": 694.204, "r_x3": 218.904, "r_y3": 694.204, "coord_origin": "TOPLEFT"}, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 148, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 239.931, "r_y0": 701.901, "r_x1": 269.323, "r_y1": 701.901, "r_x2": 269.323, "r_y2": 694.204, "r_x3": 239.931, "r_y3": 694.204, "coord_origin": "TOPLEFT"}, "text": "Antonio", "orig": "Antonio", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 149, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 277.392, "r_y0": 701.901, "r_x1": 286.359, "r_y1": 701.901, "r_x2": 286.359, "r_y2": 694.204, "r_x3": 277.392, "r_y3": 694.204, "coord_origin": "TOPLEFT"}, "text": "Ji-", "orig": "Ji-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 150, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 712.86, "r_x1": 116.719, "r_y1": 712.86, "r_x2": 116.719, "r_y2": 705.163, "r_x3": 70.031, "r_y3": 705.163, "coord_origin": "TOPLEFT"}, "text": "meno Yepes.", "orig": "meno Yepes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 151, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 122.413, "r_y0": 712.86, "r_x1": 235.013, "r_y1": 712.86, "r_x2": 235.013, "r_y2": 705.163, "r_x3": 122.413, "r_y3": 705.163, "coord_origin": "TOPLEFT"}, "text": "Image-based table recognition:", "orig": "Image-based table recognition:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 152, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 239.335, "r_y0": 712.86, "r_x1": 286.363, "r_y1": 712.86, "r_x2": 286.363, "r_y2": 705.163, "r_x3": 239.335, "r_y3": 705.163, "coord_origin": "TOPLEFT"}, "text": "Data, model,", "orig": "Data, model,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 153, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 83.82299999999998, "r_x1": 383.646, "r_y1": 83.82299999999998, "r_x2": 383.646, "r_y2": 76.12599999999998, "r_x3": 328.781, "r_y3": 76.12599999999998, "coord_origin": "TOPLEFT"}, "text": "and evaluation.", "orig": "and evaluation.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 154, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 388.56, "r_y0": 83.82299999999998, "r_x1": 545.113, "r_y1": 83.82299999999998, "r_x2": 545.113, "r_y2": 76.12599999999998, "r_x3": 388.56, "r_y3": 76.12599999999998, "coord_origin": "TOPLEFT"}, "text": "In Andrea Vedaldi, Horst Bischof, Thomas", "orig": "In Andrea Vedaldi, Horst Bischof, Thomas", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 155, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 94.78099999999995, "r_x1": 472.306, "r_y1": 94.78099999999995, "r_x2": 472.306, "r_y2": 87.08399999999995, "r_x3": 328.781, "r_y3": 87.08399999999995, "coord_origin": "TOPLEFT"}, "text": "Brox, and Jan-Michael Frahm, editors,", "orig": "Brox, and Jan-Michael Frahm, editors,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 156, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 475.885, "r_y0": 94.65200000000004, "r_x1": 545.115, "r_y1": 94.65200000000004, "r_x2": 545.115, "r_y2": 86.92200000000003, "r_x3": 475.885, "r_y3": 86.92200000000003, "coord_origin": "TOPLEFT"}, "text": "Computer Vision -", "orig": "Computer Vision -", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 157, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 105.61099999999999, "r_x1": 371.927, "r_y1": 105.61099999999999, "r_x2": 371.927, "r_y2": 97.88099999999997, "r_x3": 328.781, "r_y3": 97.88099999999997, "coord_origin": "TOPLEFT"}, "text": "ECCV 2020", "orig": "ECCV 2020", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 158, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 371.926, "r_y0": 105.74000000000001, "r_x1": 374.168, "r_y1": 105.74000000000001, "r_x2": 374.168, "r_y2": 98.043, "r_x3": 371.926, "r_y3": 98.043, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 159, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 376.472, "r_y0": 105.74000000000001, "r_x1": 545.112, "r_y1": 105.74000000000001, "r_x2": 545.112, "r_y2": 98.043, "r_x3": 376.472, "r_y3": 98.043, "coord_origin": "TOPLEFT"}, "text": "pages 564-580, Cham, 2020. Springer Interna-", "orig": "pages 564-580, Cham, 2020. Springer Interna-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 160, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 116.69899999999996, "r_x1": 417.701, "r_y1": 116.69899999999996, "r_x2": 417.701, "r_y2": 109.00199999999995, "r_x3": 328.781, "r_y3": 109.00199999999995, "coord_origin": "TOPLEFT"}, "text": "tional Publishing. 2, 3, 7", "orig": "tional Publishing. 2, 3, 7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 161, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 128.654, "r_x1": 323.8, "r_y1": 128.654, "r_x2": 323.8, "r_y2": 120.957, "r_x3": 308.862, "r_y3": 120.957, "coord_origin": "TOPLEFT"}, "text": "[38]", "orig": "[38]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 162, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.785, "r_y0": 128.654, "r_x1": 523.15, "r_y1": 128.654, "r_x2": 523.15, "r_y2": 120.957, "r_x3": 328.785, "r_y3": 120.957, "coord_origin": "TOPLEFT"}, "text": "Xu Zhong, Jianbin Tang, and Antonio Jimeno Yepes.", "orig": "Xu Zhong, Jianbin Tang, and Antonio Jimeno Yepes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 163, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 528.171, "r_y0": 128.654, "r_x1": 545.109, "r_y1": 128.654, "r_x2": 545.109, "r_y2": 120.957, "r_x3": 528.171, "r_y3": 120.957, "coord_origin": "TOPLEFT"}, "text": "Pub-", "orig": "Pub-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 164, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 139.61300000000006, "r_x1": 545.113, "r_y1": 139.61300000000006, "r_x2": 545.113, "r_y2": 131.91600000000005, "r_x3": 328.781, "r_y3": 131.91600000000005, "coord_origin": "TOPLEFT"}, "text": "laynet: Largest dataset ever for document layout analysis. In", "orig": "laynet: Largest dataset ever for document layout analysis. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 165, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 150.44299999999998, "r_x1": 545.113, "r_y1": 150.44299999999998, "r_x2": 545.113, "r_y2": 142.71299999999997, "r_x3": 328.781, "r_y3": 142.71299999999997, "coord_origin": "TOPLEFT"}, "text": "2019 International Conference on Document Analysis and", "orig": "2019 International Conference on Document Analysis and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 166, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 161.40200000000004, "r_x1": 406.322, "r_y1": 161.40200000000004, "r_x2": 406.322, "r_y2": 153.67200000000003, "r_x3": 328.781, "r_y3": 153.67200000000003, "coord_origin": "TOPLEFT"}, "text": "Recognition (ICDAR)", "orig": "Recognition (ICDAR)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 167, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 406.322, "r_y0": 161.53099999999995, "r_x1": 506.181, "r_y1": 161.53099999999995, "r_x2": 506.181, "r_y2": 153.83399999999995, "r_x3": 406.322, "r_y3": 153.83399999999995, "coord_origin": "TOPLEFT"}, "text": ", pages 1015-1022, 2019. 1", "orig": ", pages 1015-1022, 2019. 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 168, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 292.63, "r_y0": 742.954, "r_x1": 302.593, "r_y1": 742.954, "r_x2": 302.593, "r_y2": 734.402, "r_x3": 292.63, "r_y3": 734.402, "coord_origin": "TOPLEFT"}, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "parsed_page": null, "predictions": {"layout": {"clusters": [{"id": 15, "label": "text", "bbox": {"l": 70.031, "t": 75.96400000000006, "r": 286.362, "b": 94.78200000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.6886764168739319, "cells": [{"index": 0, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 83.69399999999996, "r_x1": 223.581, "r_y1": 83.69399999999996, "r_x2": 223.581, "r_y2": 75.96400000000006, "r_x3": 70.031, "r_y3": 75.96400000000006, "coord_origin": "TOPLEFT"}, "text": "Computer Vision and Pattern Recognition", "orig": "Computer Vision and Pattern Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 223.579, "r_y0": 83.82299999999998, "r_x1": 225.821, "r_y1": 83.82299999999998, "r_x2": 225.821, "r_y2": 76.12599999999998, "r_x3": 223.579, "r_y3": 76.12599999999998, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 229.183, "r_y0": 83.82299999999998, "r_x1": 286.362, "r_y1": 83.82299999999998, "r_x2": 286.362, "r_y2": 76.12599999999998, "r_x3": 229.183, "r_y3": 76.12599999999998, "coord_origin": "TOPLEFT"}, "text": "pages 658-666,", "orig": "pages 658-666,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 94.78200000000004, "r_x1": 97.917, "r_y1": 94.78200000000004, "r_x2": 97.917, "r_y2": 87.08500000000004, "r_x3": 70.031, "r_y3": 87.08500000000004, "coord_origin": "TOPLEFT"}, "text": "2019. 6", "orig": "2019. 6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 13, "label": "list_item", "bbox": {"l": 50.112, "t": 98.40800000000002, "r": 286.366, "b": 160.89999999999998, "coord_origin": "TOPLEFT"}, "confidence": 0.7723011374473572, "cells": [{"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 106.10500000000002, "r_x1": 65.05, "r_y1": 106.10500000000002, "r_x2": 65.05, "r_y2": 98.40800000000002, "r_x3": 50.112, "r_y3": 98.40800000000002, "coord_origin": "TOPLEFT"}, "text": "[26]", "orig": "[26]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 106.10500000000002, "r_x1": 286.359, "r_y1": 106.10500000000002, "r_x2": 286.359, "r_y2": 98.40800000000002, "r_x3": 70.035, "r_y3": 98.40800000000002, "coord_origin": "TOPLEFT"}, "text": "Sebastian Schreiber, Stefan Agne, Ivo Wolf, Andreas Den-", "orig": "Sebastian Schreiber, Stefan Agne, Ivo Wolf, Andreas Den-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 117.06399999999996, "r_x1": 286.363, "r_y1": 117.06399999999996, "r_x2": 286.363, "r_y2": 109.36699999999996, "r_x3": 70.031, "r_y3": 109.36699999999996, "coord_origin": "TOPLEFT"}, "text": "gel, and Sheraz Ahmed. Deepdesrt: Deep learning for detec-", "orig": "gel, and Sheraz Ahmed. Deepdesrt: Deep learning for detec-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 128.02300000000002, "r_x1": 286.363, "r_y1": 128.02300000000002, "r_x2": 286.363, "r_y2": 120.32600000000002, "r_x3": 70.031, "r_y3": 120.32600000000002, "coord_origin": "TOPLEFT"}, "text": "tion and structure recognition of tables in document images.", "orig": "tion and structure recognition of tables in document images.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 138.98199999999997, "r_x1": 77.5, "r_y1": 138.98199999999997, "r_x2": 77.5, "r_y2": 131.28499999999997, "r_x3": 70.031, "r_y3": 131.28499999999997, "coord_origin": "TOPLEFT"}, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 80.56, "r_y0": 138.85299999999995, "r_x1": 286.366, "r_y1": 138.85299999999995, "r_x2": 286.366, "r_y2": 131.12300000000005, "r_x3": 80.56, "r_y3": 131.12300000000005, "coord_origin": "TOPLEFT"}, "text": "2017 14th IAPR International Conference on Document", "orig": "2017 14th IAPR International Conference on Document", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 149.812, "r_x1": 195.229, "r_y1": 149.812, "r_x2": 195.229, "r_y2": 142.082, "r_x3": 70.031, "r_y3": 142.082, "coord_origin": "TOPLEFT"}, "text": "Analysis and Recognition (ICDAR)", "orig": "Analysis and Recognition (ICDAR)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 195.231, "r_y0": 149.94100000000003, "r_x1": 286.365, "r_y1": 149.94100000000003, "r_x2": 286.365, "r_y2": 142.24400000000003, "r_x3": 195.231, "r_y3": 142.24400000000003, "coord_origin": "TOPLEFT"}, "text": ", volume 01, pages 1162-", "orig": ", volume 01, pages 1162-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 160.89999999999998, "r_x1": 120.333, "r_y1": 160.89999999999998, "r_x2": 120.333, "r_y2": 153.20299999999997, "r_x3": 70.031, "r_y3": 153.20299999999997, "coord_origin": "TOPLEFT"}, "text": "1167, 2017. 1", "orig": "1167, 2017. 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 2, "label": "list_item", "bbox": {"l": 50.112, "t": 164.52700000000004, "r": 286.363, "b": 227.01800000000003, "coord_origin": "TOPLEFT"}, "confidence": 0.8580600619316101, "cells": [{"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 172.22400000000005, "r_x1": 65.05, "r_y1": 172.22400000000005, "r_x2": 65.05, "r_y2": 164.52700000000004, "r_x3": 50.112, "r_y3": 164.52700000000004, "coord_origin": "TOPLEFT"}, "text": "[27]", "orig": "[27]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 172.22400000000005, "r_x1": 286.359, "r_y1": 172.22400000000005, "r_x2": 286.359, "r_y2": 164.52700000000004, "r_x3": 70.035, "r_y3": 164.52700000000004, "coord_origin": "TOPLEFT"}, "text": "Sebastian Schreiber, Stefan Agne, Ivo Wolf, Andreas Den-", "orig": "Sebastian Schreiber, Stefan Agne, Ivo Wolf, Andreas Den-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 183.183, "r_x1": 158.395, "r_y1": 183.183, "r_x2": 158.395, "r_y2": 175.486, "r_x3": 70.031, "r_y3": 175.486, "coord_origin": "TOPLEFT"}, "text": "gel, and Sheraz Ahmed.", "orig": "gel, and Sheraz Ahmed.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 164.035, "r_y0": 183.183, "r_x1": 202.877, "r_y1": 183.183, "r_x2": 202.877, "r_y2": 175.486, "r_x3": 164.035, "r_y3": 175.486, "coord_origin": "TOPLEFT"}, "text": "Deepdesrt:", "orig": "Deepdesrt:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 207.163, "r_y0": 183.183, "r_x1": 286.363, "r_y1": 183.183, "r_x2": 286.363, "r_y2": 175.486, "r_x3": 207.163, "r_y3": 175.486, "coord_origin": "TOPLEFT"}, "text": "Deep learning for de-", "orig": "Deep learning for de-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 194.14200000000005, "r_x1": 286.363, "r_y1": 194.14200000000005, "r_x2": 286.363, "r_y2": 186.44500000000005, "r_x3": 70.031, "r_y3": 186.44500000000005, "coord_origin": "TOPLEFT"}, "text": "tection and structure recognition of tables in document im-", "orig": "tection and structure recognition of tables in document im-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 19, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 205.101, "r_x1": 88.206, "r_y1": 205.101, "r_x2": 88.206, "r_y2": 197.404, "r_x3": 70.031, "r_y3": 197.404, "coord_origin": "TOPLEFT"}, "text": "ages.", "orig": "ages.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 20, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 93.864, "r_y0": 205.101, "r_x1": 101.333, "r_y1": 205.101, "r_x2": 101.333, "r_y2": 197.404, "r_x3": 93.864, "r_y3": 197.404, "coord_origin": "TOPLEFT"}, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 21, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 104.331, "r_y0": 204.97199999999998, "r_x1": 286.358, "r_y1": 204.97199999999998, "r_x2": 286.358, "r_y2": 197.24199999999996, "r_x3": 104.331, "r_y3": 197.24199999999996, "coord_origin": "TOPLEFT"}, "text": "2017 14th IAPR international conference on doc-", "orig": "2017 14th IAPR international conference on doc-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 22, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 215.92999999999995, "r_x1": 220.487, "r_y1": 215.92999999999995, "r_x2": 220.487, "r_y2": 208.20000000000005, "r_x3": 70.031, "r_y3": 208.20000000000005, "coord_origin": "TOPLEFT"}, "text": "ument analysis and recognition (ICDAR)", "orig": "ument analysis and recognition (ICDAR)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 23, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 220.484, "r_y0": 216.05899999999997, "r_x1": 222.726, "r_y1": 216.05899999999997, "r_x2": 222.726, "r_y2": 208.36199999999997, "r_x3": 220.484, "r_y3": 208.36199999999997, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 24, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 225.909, "r_y0": 216.05899999999997, "r_x1": 286.36, "r_y1": 216.05899999999997, "r_x2": 286.36, "r_y2": 208.36199999999997, "r_x3": 225.909, "r_y3": 208.36199999999997, "coord_origin": "TOPLEFT"}, "text": "volume 1, pages", "orig": "volume 1, pages", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 25, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 227.01800000000003, "r_x1": 166.653, "r_y1": 227.01800000000003, "r_x2": 166.653, "r_y2": 219.32100000000003, "r_x3": 70.031, "r_y3": 219.32100000000003, "coord_origin": "TOPLEFT"}, "text": "1162-1167. IEEE, 2017. 3", "orig": "1162-1167. IEEE, 2017. 3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 4, "label": "list_item", "bbox": {"l": 50.112, "t": 230.64499999999998, "r": 286.366, "b": 271.21900000000005, "coord_origin": "TOPLEFT"}, "confidence": 0.8512731194496155, "cells": [{"index": 26, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 238.34199999999998, "r_x1": 65.05, "r_y1": 238.34199999999998, "r_x2": 65.05, "r_y2": 230.64499999999998, "r_x3": 50.112, "r_y3": 230.64499999999998, "coord_origin": "TOPLEFT"}, "text": "[28]", "orig": "[28]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 27, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 238.34199999999998, "r_x1": 179.147, "r_y1": 238.34199999999998, "r_x2": 179.147, "r_y2": 230.64499999999998, "r_x3": 70.035, "r_y3": 230.64499999999998, "coord_origin": "TOPLEFT"}, "text": "Faisal Shafait and Ray Smith.", "orig": "Faisal Shafait and Ray Smith.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 28, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 184.366, "r_y0": 238.34199999999998, "r_x1": 286.359, "r_y1": 238.34199999999998, "r_x2": 286.359, "r_y2": 230.64499999999998, "r_x3": 184.366, "r_y3": 230.64499999999998, "coord_origin": "TOPLEFT"}, "text": "Table detection in heteroge-", "orig": "Table detection in heteroge-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 29, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 249.30100000000004, "r_x1": 134.804, "r_y1": 249.30100000000004, "r_x2": 134.804, "r_y2": 241.60400000000004, "r_x3": 70.031, "r_y3": 241.60400000000004, "coord_origin": "TOPLEFT"}, "text": "neous documents.", "orig": "neous documents.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 30, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 139.7, "r_y0": 249.30100000000004, "r_x1": 147.169, "r_y1": 249.30100000000004, "r_x2": 147.169, "r_y2": 241.60400000000004, "r_x3": 139.7, "r_y3": 241.60400000000004, "coord_origin": "TOPLEFT"}, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 149.933, "r_y0": 249.17200000000003, "r_x1": 286.366, "r_y1": 249.17200000000003, "r_x2": 286.366, "r_y2": 241.442, "r_x3": 149.933, "r_y3": 241.442, "coord_origin": "TOPLEFT"}, "text": "Proceedings of the 9th IAPR Interna-", "orig": "Proceedings of the 9th IAPR Interna-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 260.131, "r_x1": 244.688, "r_y1": 260.131, "r_x2": 244.688, "r_y2": 252.40099999999995, "r_x3": 70.031, "r_y3": 252.40099999999995, "coord_origin": "TOPLEFT"}, "text": "tional Workshop on Document Analysis Systems", "orig": "tional Workshop on Document Analysis Systems", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 244.691, "r_y0": 260.26, "r_x1": 246.933, "r_y1": 260.26, "r_x2": 246.933, "r_y2": 252.563, "r_x3": 244.691, "r_y3": 252.563, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 249.775, "r_y0": 260.26, "r_x1": 286.358, "r_y1": 260.26, "r_x2": 286.358, "r_y2": 252.563, "r_x3": 249.775, "r_y3": 252.563, "coord_origin": "TOPLEFT"}, "text": "pages 65-", "orig": "pages 65-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 271.21900000000005, "r_x1": 111.366, "r_y1": 271.21900000000005, "r_x2": 111.366, "r_y2": 263.52200000000005, "r_x3": 70.031, "r_y3": 263.52200000000005, "coord_origin": "TOPLEFT"}, "text": "72, 2010. 2", "orig": "72, 2010. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 5, "label": "list_item", "bbox": {"l": 50.112, "t": 274.846, "r": 286.366, "b": 326.378, "coord_origin": "TOPLEFT"}, "confidence": 0.8494512438774109, "cells": [{"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 282.543, "r_x1": 65.05, "r_y1": 282.543, "r_x2": 65.05, "r_y2": 274.846, "r_x3": 50.112, "r_y3": 274.846, "coord_origin": "TOPLEFT"}, "text": "[29]", "orig": "[29]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 282.543, "r_x1": 94.944, "r_y1": 282.543, "r_x2": 94.944, "r_y2": 274.846, "r_x3": 70.035, "r_y3": 274.846, "coord_origin": "TOPLEFT"}, "text": "Shoaib", "orig": "Shoaib", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 100.871, "r_y0": 282.543, "r_x1": 127.268, "r_y1": 282.543, "r_x2": 127.268, "r_y2": 274.846, "r_x3": 100.871, "r_y3": 274.846, "coord_origin": "TOPLEFT"}, "text": "Ahmed", "orig": "Ahmed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 133.195, "r_y0": 282.543, "r_x1": 165.832, "r_y1": 282.543, "r_x2": 165.832, "r_y2": 274.846, "r_x3": 133.195, "r_y3": 274.846, "coord_origin": "TOPLEFT"}, "text": "Siddiqui,", "orig": "Siddiqui,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 172.683, "r_y0": 282.543, "r_x1": 194.094, "r_y1": 282.543, "r_x2": 194.094, "r_y2": 274.846, "r_x3": 172.683, "r_y3": 274.846, "coord_origin": "TOPLEFT"}, "text": "Imran", "orig": "Imran", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 200.021, "r_y0": 282.543, "r_x1": 211.48, "r_y1": 282.543, "r_x2": 211.48, "r_y2": 274.846, "r_x3": 200.021, "r_y3": 274.846, "coord_origin": "TOPLEFT"}, "text": "Ali", "orig": "Ali", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 217.407, "r_y0": 282.543, "r_x1": 239.438, "r_y1": 282.543, "r_x2": 239.438, "r_y2": 274.846, "r_x3": 217.407, "r_y3": 274.846, "coord_origin": "TOPLEFT"}, "text": "Fateh,", "orig": "Fateh,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 246.288, "r_y0": 282.543, "r_x1": 264.221, "r_y1": 282.543, "r_x2": 264.221, "r_y2": 274.846, "r_x3": 246.288, "r_y3": 274.846, "coord_origin": "TOPLEFT"}, "text": "Syed", "orig": "Syed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 270.147, "r_y0": 282.543, "r_x1": 286.359, "r_y1": 282.543, "r_x2": 286.359, "r_y2": 274.846, "r_x3": 270.147, "r_y3": 274.846, "coord_origin": "TOPLEFT"}, "text": "Tah-", "orig": "Tah-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 293.502, "r_x1": 85.964, "r_y1": 293.502, "r_x2": 85.964, "r_y2": 285.805, "r_x3": 70.031, "r_y3": 285.805, "coord_origin": "TOPLEFT"}, "text": "seen", "orig": "seen", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 91.021, "r_y0": 293.502, "r_x1": 108.945, "r_y1": 293.502, "r_x2": 108.945, "r_y2": 285.805, "r_x3": 91.021, "r_y3": 285.805, "coord_origin": "TOPLEFT"}, "text": "Raza", "orig": "Raza", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 114.002, "r_y0": 293.502, "r_x1": 135.674, "r_y1": 293.502, "r_x2": 135.674, "r_y2": 285.805, "r_x3": 114.002, "r_y3": 285.805, "coord_origin": "TOPLEFT"}, "text": "Rizvi,", "orig": "Rizvi,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 48, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 141.43, "r_y0": 293.502, "r_x1": 171.306, "r_y1": 293.502, "r_x2": 171.306, "r_y2": 285.805, "r_x3": 141.43, "r_y3": 285.805, "coord_origin": "TOPLEFT"}, "text": "Andreas", "orig": "Andreas", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 49, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 176.364, "r_y0": 293.502, "r_x1": 204.5, "r_y1": 293.502, "r_x2": 204.5, "r_y2": 285.805, "r_x3": 176.364, "r_y3": 285.805, "coord_origin": "TOPLEFT"}, "text": "Dengel,", "orig": "Dengel,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 50, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 210.265, "r_y0": 293.502, "r_x1": 223.213, "r_y1": 293.502, "r_x2": 223.213, "r_y2": 285.805, "r_x3": 210.265, "r_y3": 285.805, "coord_origin": "TOPLEFT"}, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 51, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 228.27, "r_y0": 293.502, "r_x1": 252.668, "r_y1": 293.502, "r_x2": 252.668, "r_y2": 285.805, "r_x3": 228.27, "r_y3": 285.805, "coord_origin": "TOPLEFT"}, "text": "Sheraz", "orig": "Sheraz", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 52, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 257.725, "r_y0": 293.502, "r_x1": 286.363, "r_y1": 293.502, "r_x2": 286.363, "r_y2": 285.805, "r_x3": 257.725, "r_y3": 285.805, "coord_origin": "TOPLEFT"}, "text": "Ahmed.", "orig": "Ahmed.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 53, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 304.461, "r_x1": 286.363, "r_y1": 304.461, "r_x2": 286.363, "r_y2": 296.764, "r_x3": 70.031, "r_y3": 296.764, "coord_origin": "TOPLEFT"}, "text": "Deeptabstr: Deep learning based table structure recognition.", "orig": "Deeptabstr: Deep learning based table structure recognition.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 54, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 315.42, "r_x1": 77.5, "r_y1": 315.42, "r_x2": 77.5, "r_y2": 307.723, "r_x3": 70.031, "r_y3": 307.723, "coord_origin": "TOPLEFT"}, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 55, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 79.35, "r_y0": 315.291, "r_x1": 286.366, "r_y1": 315.291, "r_x2": 286.366, "r_y2": 307.561, "r_x3": 79.35, "r_y3": 307.561, "coord_origin": "TOPLEFT"}, "text": "2019 International Conference on Document Analysis and", "orig": "2019 International Conference on Document Analysis and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 56, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 326.249, "r_x1": 147.572, "r_y1": 326.249, "r_x2": 147.572, "r_y2": 318.519, "r_x3": 70.031, "r_y3": 318.519, "coord_origin": "TOPLEFT"}, "text": "Recognition (ICDAR)", "orig": "Recognition (ICDAR)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 57, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 147.572, "r_y0": 326.378, "r_x1": 271.335, "r_y1": 326.378, "r_x2": 271.335, "r_y2": 318.681, "r_x3": 147.572, "r_y3": 318.681, "coord_origin": "TOPLEFT"}, "text": ", pages 1403-1409. IEEE, 2019. 3", "orig": ", pages 1403-1409. IEEE, 2019. 3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 3, "label": "list_item", "bbox": {"l": 50.112, "t": 330.005, "r": 286.363, "b": 381.538, "coord_origin": "TOPLEFT"}, "confidence": 0.8567671179771423, "cells": [{"index": 58, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 337.702, "r_x1": 65.05, "r_y1": 337.702, "r_x2": 65.05, "r_y2": 330.005, "r_x3": 50.112, "r_y3": 330.005, "coord_origin": "TOPLEFT"}, "text": "[30]", "orig": "[30]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 59, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 337.702, "r_x1": 286.359, "r_y1": 337.702, "r_x2": 286.359, "r_y2": 330.005, "r_x3": 70.035, "r_y3": 330.005, "coord_origin": "TOPLEFT"}, "text": "Peter WJ Staar, Michele Dolfi, Christoph Auer, and Costas", "orig": "Peter WJ Staar, Michele Dolfi, Christoph Auer, and Costas", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 60, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 348.661, "r_x1": 286.363, "r_y1": 348.661, "r_x2": 286.363, "r_y2": 340.964, "r_x3": 70.031, "r_y3": 340.964, "coord_origin": "TOPLEFT"}, "text": "Bekas. Corpus conversion service: A machine learning plat-", "orig": "Bekas. Corpus conversion service: A machine learning plat-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 61, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 359.62, "r_x1": 198.824, "r_y1": 359.62, "r_x2": 198.824, "r_y2": 351.923, "r_x3": 70.031, "r_y3": 351.923, "coord_origin": "TOPLEFT"}, "text": "form to ingest documents at scale.", "orig": "form to ingest documents at scale.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 62, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 206.06, "r_y0": 359.62, "r_x1": 213.529, "r_y1": 359.62, "r_x2": 213.529, "r_y2": 351.923, "r_x3": 206.06, "r_y3": 351.923, "coord_origin": "TOPLEFT"}, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 63, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 217.021, "r_y0": 359.491, "r_x1": 286.358, "r_y1": 359.491, "r_x2": 286.358, "r_y2": 351.761, "r_x3": 217.021, "r_y3": 351.761, "coord_origin": "TOPLEFT"}, "text": "Proceedings of the", "orig": "Proceedings of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 64, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 370.45, "r_x1": 143.08, "r_y1": 370.45, "r_x2": 143.08, "r_y2": 362.72, "r_x3": 70.031, "r_y3": 362.72, "coord_origin": "TOPLEFT"}, "text": "24th ACM SIGKDD", "orig": "24th ACM SIGKDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 65, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 143.078, "r_y0": 370.579, "r_x1": 145.32, "r_y1": 370.579, "r_x2": 145.32, "r_y2": 362.882, "r_x3": 143.078, "r_y3": 362.882, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 66, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 148.108, "r_y0": 370.579, "r_x1": 286.361, "r_y1": 370.579, "r_x2": 286.361, "r_y2": 362.882, "r_x3": 148.108, "r_y3": 362.882, "coord_origin": "TOPLEFT"}, "text": "KDD '18, pages 774-782, New York,", "orig": "KDD '18, pages 774-782, New York,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 67, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 381.538, "r_x1": 161.157, "r_y1": 381.538, "r_x2": 161.157, "r_y2": 373.841, "r_x3": 70.031, "r_y3": 373.841, "coord_origin": "TOPLEFT"}, "text": "NY, USA, 2018. ACM. 1", "orig": "NY, USA, 2018. ACM. 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 1, "label": "list_item", "bbox": {"l": 50.112, "t": 385.165, "r": 286.364, "b": 458.615, "coord_origin": "TOPLEFT"}, "confidence": 0.8832162618637085, "cells": [{"index": 68, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 392.862, "r_x1": 65.05, "r_y1": 392.862, "r_x2": 65.05, "r_y2": 385.165, "r_x3": 50.112, "r_y3": 385.165, "coord_origin": "TOPLEFT"}, "text": "[31]", "orig": "[31]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 69, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 392.862, "r_x1": 286.359, "r_y1": 392.862, "r_x2": 286.359, "r_y2": 385.165, "r_x3": 70.035, "r_y3": 385.165, "coord_origin": "TOPLEFT"}, "text": "Ashish Vaswani, Noam Shazeer, Niki Parmar, Jakob Uszko-", "orig": "Ashish Vaswani, Noam Shazeer, Niki Parmar, Jakob Uszko-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 70, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 403.821, "r_x1": 84.225, "r_y1": 403.821, "r_x2": 84.225, "r_y2": 396.124, "r_x3": 70.031, "r_y3": 396.124, "coord_origin": "TOPLEFT"}, "text": "reit,", "orig": "reit,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 71, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 87.489, "r_y0": 403.821, "r_x1": 286.363, "r_y1": 403.821, "r_x2": 286.363, "r_y2": 396.124, "r_x3": 87.489, "r_y3": 396.124, "coord_origin": "TOPLEFT"}, "text": "Llion Jones, Aidan N Gomez, \u0141 ukasz Kaiser, and Il-", "orig": "Llion Jones, Aidan N Gomez, \u0141 ukasz Kaiser, and Il-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 72, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 414.78, "r_x1": 78.997, "r_y1": 414.78, "r_x2": 78.997, "r_y2": 407.083, "r_x3": 70.031, "r_y3": 407.083, "coord_origin": "TOPLEFT"}, "text": "lia", "orig": "lia", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 73, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 82.871, "r_y0": 414.78, "r_x1": 125.47, "r_y1": 414.78, "r_x2": 125.47, "r_y2": 407.083, "r_x3": 82.871, "r_y3": 407.083, "coord_origin": "TOPLEFT"}, "text": "Polosukhin.", "orig": "Polosukhin.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 74, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 133.908, "r_y0": 414.78, "r_x1": 167.783, "r_y1": 414.78, "r_x2": 167.783, "r_y2": 407.083, "r_x3": 133.908, "r_y3": 407.083, "coord_origin": "TOPLEFT"}, "text": "Attention", "orig": "Attention", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 75, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 171.656, "r_y0": 414.78, "r_x1": 177.637, "r_y1": 414.78, "r_x2": 177.637, "r_y2": 407.083, "r_x3": 171.656, "r_y3": 407.083, "coord_origin": "TOPLEFT"}, "text": "is", "orig": "is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 76, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 181.51, "r_y0": 414.78, "r_x1": 190.477, "r_y1": 414.78, "r_x2": 190.477, "r_y2": 407.083, "r_x3": 181.51, "r_y3": 407.083, "coord_origin": "TOPLEFT"}, "text": "all", "orig": "all", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 77, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 194.341, "r_y0": 414.78, "r_x1": 230.834, "r_y1": 414.78, "r_x2": 230.834, "r_y2": 407.083, "r_x3": 194.341, "r_y3": 407.083, "coord_origin": "TOPLEFT"}, "text": "you need.", "orig": "you need.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 78, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 239.272, "r_y0": 414.78, "r_x1": 246.741, "r_y1": 414.78, "r_x2": 246.741, "r_y2": 407.083, "r_x3": 239.272, "r_y3": 407.083, "coord_origin": "TOPLEFT"}, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 79, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 250.614, "r_y0": 414.78, "r_x1": 255.842, "r_y1": 414.78, "r_x2": 255.842, "r_y2": 407.083, "r_x3": 250.614, "r_y3": 407.083, "coord_origin": "TOPLEFT"}, "text": "I.", "orig": "I.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 80, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 259.715, "r_y0": 414.78, "r_x1": 286.363, "r_y1": 414.78, "r_x2": 286.363, "r_y2": 407.083, "r_x3": 259.715, "r_y3": 407.083, "coord_origin": "TOPLEFT"}, "text": "Guyon,", "orig": "Guyon,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 81, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 425.739, "r_x1": 286.363, "r_y1": 425.739, "r_x2": 286.363, "r_y2": 418.042, "r_x3": 70.031, "r_y3": 418.042, "coord_origin": "TOPLEFT"}, "text": "U. V. Luxburg, S. Bengio, H. Wallach, R. Fergus, S. Vish-", "orig": "U. V. Luxburg, S. Bengio, H. Wallach, R. Fergus, S. Vish-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 82, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 436.697, "r_x1": 196.762, "r_y1": 436.697, "r_x2": 196.762, "r_y2": 429.0, "r_x3": 70.031, "r_y3": 429.0, "coord_origin": "TOPLEFT"}, "text": "wanathan, and R. Garnett, editors,", "orig": "wanathan, and R. Garnett, editors,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 83, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 200.202, "r_y0": 436.568, "r_x1": 286.36, "r_y1": 436.568, "r_x2": 286.36, "r_y2": 428.838, "r_x3": 200.202, "r_y3": 428.838, "coord_origin": "TOPLEFT"}, "text": "Advances in Neural In-", "orig": "Advances in Neural In-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 84, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 447.527, "r_x1": 189.194, "r_y1": 447.527, "r_x2": 189.194, "r_y2": 439.797, "r_x3": 70.031, "r_y3": 439.797, "coord_origin": "TOPLEFT"}, "text": "formation Processing Systems 30", "orig": "formation Processing Systems 30", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 85, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 189.195, "r_y0": 447.656, "r_x1": 191.437, "r_y1": 447.656, "r_x2": 191.437, "r_y2": 439.959, "r_x3": 189.195, "r_y3": 439.959, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 86, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 193.795, "r_y0": 447.656, "r_x1": 286.364, "r_y1": 447.656, "r_x2": 286.364, "r_y2": 439.959, "r_x3": 193.795, "r_y3": 439.959, "coord_origin": "TOPLEFT"}, "text": "pages 5998-6008. Curran", "orig": "pages 5998-6008. Curran", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 87, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 458.615, "r_x1": 158.924, "r_y1": 458.615, "r_x2": 158.924, "r_y2": 450.918, "r_x3": 70.031, "r_y3": 450.918, "coord_origin": "TOPLEFT"}, "text": "Associates, Inc., 2017. 5", "orig": "Associates, Inc., 2017. 5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 6, "label": "list_item", "bbox": {"l": 50.112, "t": 462.242, "r": 286.363, "b": 502.816, "coord_origin": "TOPLEFT"}, "confidence": 0.8431925177574158, "cells": [{"index": 88, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 469.939, "r_x1": 65.05, "r_y1": 469.939, "r_x2": 65.05, "r_y2": 462.242, "r_x3": 50.112, "r_y3": 462.242, "coord_origin": "TOPLEFT"}, "text": "[32]", "orig": "[32]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 89, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 469.939, "r_x1": 88.963, "r_y1": 469.939, "r_x2": 88.963, "r_y2": 462.242, "r_x3": 70.035, "r_y3": 462.242, "coord_origin": "TOPLEFT"}, "text": "Oriol", "orig": "Oriol", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 90, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 92.81, "r_y0": 469.939, "r_x1": 122.274, "r_y1": 469.939, "r_x2": 122.274, "r_y2": 462.242, "r_x3": 92.81, "r_y3": 462.242, "coord_origin": "TOPLEFT"}, "text": "Vinyals,", "orig": "Vinyals,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 91, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 126.524, "r_y0": 469.939, "r_x1": 194.695, "r_y1": 469.939, "r_x2": 194.695, "r_y2": 462.242, "r_x3": 126.524, "r_y3": 462.242, "coord_origin": "TOPLEFT"}, "text": "Alexander Toshev,", "orig": "Alexander Toshev,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 92, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 198.954, "r_y0": 469.939, "r_x1": 286.359, "r_y1": 469.939, "r_x2": 286.359, "r_y2": 462.242, "r_x3": 198.954, "r_y3": 462.242, "coord_origin": "TOPLEFT"}, "text": "Samy Bengio, and Du-", "orig": "Samy Bengio, and Du-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 93, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 480.898, "r_x1": 116.28, "r_y1": 480.898, "r_x2": 116.28, "r_y2": 473.201, "r_x3": 70.031, "r_y3": 473.201, "coord_origin": "TOPLEFT"}, "text": "mitru Erhan.", "orig": "mitru Erhan.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 94, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 122.484, "r_y0": 480.898, "r_x1": 175.924, "r_y1": 480.898, "r_x2": 175.924, "r_y2": 473.201, "r_x3": 122.484, "r_y3": 473.201, "coord_origin": "TOPLEFT"}, "text": "Show and tell:", "orig": "Show and tell:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 95, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 180.56, "r_y0": 480.898, "r_x1": 286.363, "r_y1": 480.898, "r_x2": 286.363, "r_y2": 473.201, "r_x3": 180.56, "r_y3": 473.201, "coord_origin": "TOPLEFT"}, "text": "A neural image caption gen-", "orig": "A neural image caption gen-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 96, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 491.857, "r_x1": 103.305, "r_y1": 491.857, "r_x2": 103.305, "r_y2": 484.16, "r_x3": 70.031, "r_y3": 484.16, "coord_origin": "TOPLEFT"}, "text": "erator. In", "orig": "erator. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 97, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 105.516, "r_y0": 491.728, "r_x1": 286.359, "r_y1": 491.728, "r_x2": 286.359, "r_y2": 483.998, "r_x3": 105.516, "r_y3": 483.998, "coord_origin": "TOPLEFT"}, "text": "Proceedings of the IEEE Conference on Computer", "orig": "Proceedings of the IEEE Conference on Computer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 98, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 502.687, "r_x1": 212.516, "r_y1": 502.687, "r_x2": 212.516, "r_y2": 494.957, "r_x3": 70.031, "r_y3": 494.957, "coord_origin": "TOPLEFT"}, "text": "Vision and Pattern Recognition (CVPR)", "orig": "Vision and Pattern Recognition (CVPR)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 99, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 212.514, "r_y0": 502.816, "r_x1": 263.56, "r_y1": 502.816, "r_x2": 263.56, "r_y2": 495.119, "r_x3": 212.514, "r_y3": 495.119, "coord_origin": "TOPLEFT"}, "text": ", June 2015. 2", "orig": ", June 2015. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 7, "label": "list_item", "bbox": {"l": 50.112, "t": 506.443, "r": 286.363, "b": 547.016, "coord_origin": "TOPLEFT"}, "confidence": 0.8405635952949524, "cells": [{"index": 100, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 514.14, "r_x1": 65.05, "r_y1": 514.14, "r_x2": 65.05, "r_y2": 506.443, "r_x3": 50.112, "r_y3": 506.443, "coord_origin": "TOPLEFT"}, "text": "[33]", "orig": "[33]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 101, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 514.14, "r_x1": 247.373, "r_y1": 514.14, "r_x2": 247.373, "r_y2": 506.443, "r_x3": 70.035, "r_y3": 506.443, "coord_origin": "TOPLEFT"}, "text": "Wenyuan Xue, Qingyong Li, and Dacheng Tao.", "orig": "Wenyuan Xue, Qingyong Li, and Dacheng Tao.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 102, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 253.972, "r_y0": 514.14, "r_x1": 286.359, "r_y1": 514.14, "r_x2": 286.359, "r_y2": 506.443, "r_x3": 253.972, "r_y3": 506.443, "coord_origin": "TOPLEFT"}, "text": "Res2tim:", "orig": "Res2tim:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 103, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 525.0989999999999, "r_x1": 253.125, "r_y1": 525.0989999999999, "r_x2": 253.125, "r_y2": 517.402, "r_x3": 70.031, "r_y3": 517.402, "coord_origin": "TOPLEFT"}, "text": "reconstruct syntactic structures from table images.", "orig": "reconstruct syntactic structures from table images.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 104, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 258.155, "r_y0": 525.0989999999999, "r_x1": 265.624, "r_y1": 525.0989999999999, "r_x2": 265.624, "r_y2": 517.402, "r_x3": 258.155, "r_y3": 517.402, "coord_origin": "TOPLEFT"}, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 105, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 268.429, "r_y0": 524.97, "r_x1": 286.362, "r_y1": 524.97, "r_x2": 286.362, "r_y2": 517.24, "r_x3": 268.429, "r_y3": 517.24, "coord_origin": "TOPLEFT"}, "text": "2019", "orig": "2019", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 106, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 535.929, "r_x1": 286.363, "r_y1": 535.929, "r_x2": 286.363, "r_y2": 528.1990000000001, "r_x3": 70.031, "r_y3": 528.1990000000001, "coord_origin": "TOPLEFT"}, "text": "International Conference on Document Analysis and Recog-", "orig": "International Conference on Document Analysis and Recog-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 107, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 546.887, "r_x1": 125.255, "r_y1": 546.887, "r_x2": 125.255, "r_y2": 539.157, "r_x3": 70.031, "r_y3": 539.157, "coord_origin": "TOPLEFT"}, "text": "nition (ICDAR)", "orig": "nition (ICDAR)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 108, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 125.254, "r_y0": 547.016, "r_x1": 240.051, "r_y1": 547.016, "r_x2": 240.051, "r_y2": 539.319, "r_x3": 125.254, "r_y3": 539.319, "coord_origin": "TOPLEFT"}, "text": ", pages 749-755. IEEE, 2019. 3", "orig": ", pages 749-755. IEEE, 2019. 3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 11, "label": "list_item", "bbox": {"l": 50.112, "t": 550.643, "r": 286.363, "b": 591.217, "coord_origin": "TOPLEFT"}, "confidence": 0.8241521716117859, "cells": [{"index": 109, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 558.34, "r_x1": 65.05, "r_y1": 558.34, "r_x2": 65.05, "r_y2": 550.643, "r_x3": 50.112, "r_y3": 550.643, "coord_origin": "TOPLEFT"}, "text": "[34]", "orig": "[34]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 110, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 558.34, "r_x1": 125.008, "r_y1": 558.34, "r_x2": 125.008, "r_y2": 550.643, "r_x3": 70.035, "r_y3": 550.643, "coord_origin": "TOPLEFT"}, "text": "Wenyuan Xue,", "orig": "Wenyuan Xue,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 111, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 129.823, "r_y0": 558.34, "r_x1": 181.676, "r_y1": 558.34, "r_x2": 181.676, "r_y2": 550.643, "r_x3": 129.823, "r_y3": 550.643, "coord_origin": "TOPLEFT"}, "text": "Baosheng Yu,", "orig": "Baosheng Yu,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 112, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 186.491, "r_y0": 558.34, "r_x1": 286.359, "r_y1": 558.34, "r_x2": 286.359, "r_y2": 550.643, "r_x3": 186.491, "r_y3": 550.643, "coord_origin": "TOPLEFT"}, "text": "Wen Wang, Dacheng Tao,", "orig": "Wen Wang, Dacheng Tao,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 113, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 569.299, "r_x1": 137.082, "r_y1": 569.299, "r_x2": 137.082, "r_y2": 561.602, "r_x3": 70.031, "r_y3": 561.602, "coord_origin": "TOPLEFT"}, "text": "and Qingyong Li.", "orig": "and Qingyong Li.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 114, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 145.985, "r_y0": 569.299, "r_x1": 172.382, "r_y1": 569.299, "r_x2": 172.382, "r_y2": 561.602, "r_x3": 145.985, "r_y3": 561.602, "coord_origin": "TOPLEFT"}, "text": "Tgrnet:", "orig": "Tgrnet:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 115, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 178.704, "r_y0": 569.299, "r_x1": 206.625, "r_y1": 569.299, "r_x2": 206.625, "r_y2": 561.602, "r_x3": 178.704, "r_y3": 561.602, "coord_origin": "TOPLEFT"}, "text": "A table", "orig": "A table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 116, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 210.633, "r_y0": 569.299, "r_x1": 286.363, "r_y1": 569.299, "r_x2": 286.363, "r_y2": 561.602, "r_x3": 210.633, "r_y3": 561.602, "coord_origin": "TOPLEFT"}, "text": "graph reconstruction", "orig": "graph reconstruction", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 117, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 580.258, "r_x1": 99.324, "r_y1": 580.258, "r_x2": 99.324, "r_y2": 572.561, "r_x3": 70.031, "r_y3": 572.561, "coord_origin": "TOPLEFT"}, "text": "network", "orig": "network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 118, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 104.157, "r_y0": 580.258, "r_x1": 114.612, "r_y1": 580.258, "r_x2": 114.612, "r_y2": 572.561, "r_x3": 104.157, "r_y3": 572.561, "coord_origin": "TOPLEFT"}, "text": "for", "orig": "for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 119, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 119.454, "r_y0": 580.258, "r_x1": 136.884, "r_y1": 580.258, "r_x2": 136.884, "r_y2": 572.561, "r_x3": 119.454, "r_y3": 572.561, "coord_origin": "TOPLEFT"}, "text": "table", "orig": "table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 120, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 141.717, "r_y0": 580.258, "r_x1": 173.091, "r_y1": 580.258, "r_x2": 173.091, "r_y2": 572.561, "r_x3": 141.717, "r_y3": 572.561, "coord_origin": "TOPLEFT"}, "text": "structure", "orig": "structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 121, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 177.933, "r_y0": 580.258, "r_x1": 221.007, "r_y1": 580.258, "r_x2": 221.007, "r_y2": 572.561, "r_x3": 177.933, "r_y3": 572.561, "coord_origin": "TOPLEFT"}, "text": "recognition.", "orig": "recognition.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 122, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 232.543, "r_y0": 580.129, "r_x1": 252.466, "r_y1": 580.129, "r_x2": 252.466, "r_y2": 572.399, "r_x3": 232.543, "r_y3": 572.399, "coord_origin": "TOPLEFT"}, "text": "arXiv", "orig": "arXiv", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 123, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 257.299, "r_y0": 580.129, "r_x1": 286.359, "r_y1": 580.129, "r_x2": 286.359, "r_y2": 572.399, "r_x3": 257.299, "r_y3": 572.399, "coord_origin": "TOPLEFT"}, "text": "preprint", "orig": "preprint", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 124, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 591.088, "r_x1": 135.531, "r_y1": 591.088, "r_x2": 135.531, "r_y2": 583.358, "r_x3": 70.031, "r_y3": 583.358, "coord_origin": "TOPLEFT"}, "text": "arXiv:2106.10598", "orig": "arXiv:2106.10598", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 125, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 135.53, "r_y0": 591.217, "r_x1": 167.899, "r_y1": 591.217, "r_x2": 167.899, "r_y2": 583.52, "r_x3": 135.53, "r_y3": 583.52, "coord_origin": "TOPLEFT"}, "text": ", 2021. 3", "orig": ", 2021. 3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 10, "label": "list_item", "bbox": {"l": 50.112, "t": 594.844, "r": 286.363, "b": 635.418, "coord_origin": "TOPLEFT"}, "confidence": 0.8360886573791504, "cells": [{"index": 126, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 602.5409999999999, "r_x1": 65.05, "r_y1": 602.5409999999999, "r_x2": 65.05, "r_y2": 594.844, "r_x3": 50.112, "r_y3": 594.844, "coord_origin": "TOPLEFT"}, "text": "[35]", "orig": "[35]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 127, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 602.5409999999999, "r_x1": 286.359, "r_y1": 602.5409999999999, "r_x2": 286.359, "r_y2": 594.844, "r_x3": 70.035, "r_y3": 594.844, "coord_origin": "TOPLEFT"}, "text": "Quanzeng You, Hailin Jin, Zhaowen Wang, Chen Fang, and", "orig": "Quanzeng You, Hailin Jin, Zhaowen Wang, Chen Fang, and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 128, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 613.5, "r_x1": 109.107, "r_y1": 613.5, "r_x2": 109.107, "r_y2": 605.803, "r_x3": 70.031, "r_y3": 605.803, "coord_origin": "TOPLEFT"}, "text": "Jiebo Luo.", "orig": "Jiebo Luo.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 129, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 116.226, "r_y0": 613.5, "r_x1": 271.766, "r_y1": 613.5, "r_x2": 271.766, "r_y2": 605.803, "r_x3": 116.226, "r_y3": 605.803, "coord_origin": "TOPLEFT"}, "text": "Image captioning with semantic attention.", "orig": "Image captioning with semantic attention.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 130, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 278.894, "r_y0": 613.5, "r_x1": 286.363, "r_y1": 613.5, "r_x2": 286.363, "r_y2": 605.803, "r_x3": 278.894, "r_y3": 605.803, "coord_origin": "TOPLEFT"}, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 131, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 624.33, "r_x1": 286.363, "r_y1": 624.33, "r_x2": 286.363, "r_y2": 616.6, "r_x3": 70.031, "r_y3": 616.6, "coord_origin": "TOPLEFT"}, "text": "Proceedings of the IEEE conference on computer vision and", "orig": "Proceedings of the IEEE conference on computer vision and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 132, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 635.289, "r_x1": 139.099, "r_y1": 635.289, "r_x2": 139.099, "r_y2": 627.559, "r_x3": 70.031, "r_y3": 627.559, "coord_origin": "TOPLEFT"}, "text": "pattern recognition", "orig": "pattern recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 133, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 139.098, "r_y0": 635.418, "r_x1": 238.957, "r_y1": 635.418, "r_x2": 238.957, "r_y2": 627.721, "r_x3": 139.098, "r_y3": 627.721, "coord_origin": "TOPLEFT"}, "text": ", pages 4651-4659, 2016. 4", "orig": ", pages 4651-4659, 2016. 4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 12, "label": "list_item", "bbox": {"l": 50.112, "t": 639.045, "r": 286.363, "b": 690.577, "coord_origin": "TOPLEFT"}, "confidence": 0.8079474568367004, "cells": [{"index": 134, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 646.742, "r_x1": 65.05, "r_y1": 646.742, "r_x2": 65.05, "r_y2": 639.045, "r_x3": 50.112, "r_y3": 639.045, "coord_origin": "TOPLEFT"}, "text": "[36]", "orig": "[36]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 135, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 646.742, "r_x1": 286.359, "r_y1": 646.742, "r_x2": 286.359, "r_y2": 639.045, "r_x3": 70.035, "r_y3": 639.045, "coord_origin": "TOPLEFT"}, "text": "Xinyi Zheng, Doug Burdick, Lucian Popa, Peter Zhong, and", "orig": "Xinyi Zheng, Doug Burdick, Lucian Popa, Peter Zhong, and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 136, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 657.7, "r_x1": 286.363, "r_y1": 657.7, "r_x2": 286.363, "r_y2": 650.0029999999999, "r_x3": 70.031, "r_y3": 650.0029999999999, "coord_origin": "TOPLEFT"}, "text": "Nancy Xin Ru Wang. Global table extractor (gte): A frame-", "orig": "Nancy Xin Ru Wang. Global table extractor (gte): A frame-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 137, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 668.659, "r_x1": 286.363, "r_y1": 668.659, "r_x2": 286.363, "r_y2": 660.962, "r_x3": 70.031, "r_y3": 660.962, "coord_origin": "TOPLEFT"}, "text": "work for joint table identification and cell structure recogni-", "orig": "work for joint table identification and cell structure recogni-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 138, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 679.6179999999999, "r_x1": 158.458, "r_y1": 679.6179999999999, "r_x2": 158.458, "r_y2": 671.921, "r_x3": 70.031, "r_y3": 671.921, "coord_origin": "TOPLEFT"}, "text": "tion using visual context.", "orig": "tion using visual context.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 139, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.528, "r_y0": 679.489, "r_x1": 286.362, "r_y1": 679.489, "r_x2": 286.362, "r_y2": 671.759, "r_x3": 160.528, "r_y3": 671.759, "coord_origin": "TOPLEFT"}, "text": "Winter Conference for Applications", "orig": "Winter Conference for Applications", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 140, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 690.448, "r_x1": 171.423, "r_y1": 690.448, "r_x2": 171.423, "r_y2": 682.718, "r_x3": 70.031, "r_y3": 682.718, "coord_origin": "TOPLEFT"}, "text": "in Computer Vision (WACV)", "orig": "in Computer Vision (WACV)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 141, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 171.422, "r_y0": 690.577, "r_x1": 212.757, "r_y1": 690.577, "r_x2": 212.757, "r_y2": 682.88, "r_x3": 171.422, "r_y3": 682.88, "coord_origin": "TOPLEFT"}, "text": ", 2021. 2, 3", "orig": ", 2021. 2, 3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 8, "label": "list_item", "bbox": {"l": 50.112, "t": 694.204, "r": 286.363, "b": 712.86, "coord_origin": "TOPLEFT"}, "confidence": 0.8385783433914185, "cells": [{"index": 142, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 701.901, "r_x1": 65.05, "r_y1": 701.901, "r_x2": 65.05, "r_y2": 694.204, "r_x3": 50.112, "r_y3": 694.204, "coord_origin": "TOPLEFT"}, "text": "[37]", "orig": "[37]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 143, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 701.901, "r_x1": 80.992, "r_y1": 701.901, "r_x2": 80.992, "r_y2": 694.204, "r_x3": 70.035, "r_y3": 694.204, "coord_origin": "TOPLEFT"}, "text": "Xu", "orig": "Xu", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 144, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 89.062, "r_y0": 701.901, "r_x1": 114.715, "r_y1": 701.901, "r_x2": 114.715, "r_y2": 694.204, "r_x3": 89.062, "r_y3": 694.204, "coord_origin": "TOPLEFT"}, "text": "Zhong,", "orig": "Zhong,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 145, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 124.246, "r_y0": 701.901, "r_x1": 149.146, "r_y1": 701.901, "r_x2": 149.146, "r_y2": 694.204, "r_x3": 124.246, "r_y3": 694.204, "coord_origin": "TOPLEFT"}, "text": "Elaheh", "orig": "Elaheh", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 146, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 157.225, "r_y0": 701.901, "r_x1": 209.373, "r_y1": 701.901, "r_x2": 209.373, "r_y2": 694.204, "r_x3": 157.225, "r_y3": 694.204, "coord_origin": "TOPLEFT"}, "text": "ShafieiBavani,", "orig": "ShafieiBavani,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 147, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 218.904, "r_y0": 701.901, "r_x1": 231.852, "r_y1": 701.901, "r_x2": 231.852, "r_y2": 694.204, "r_x3": 218.904, "r_y3": 694.204, "coord_origin": "TOPLEFT"}, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 148, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 239.931, "r_y0": 701.901, "r_x1": 269.323, "r_y1": 701.901, "r_x2": 269.323, "r_y2": 694.204, "r_x3": 239.931, "r_y3": 694.204, "coord_origin": "TOPLEFT"}, "text": "Antonio", "orig": "Antonio", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 149, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 277.392, "r_y0": 701.901, "r_x1": 286.359, "r_y1": 701.901, "r_x2": 286.359, "r_y2": 694.204, "r_x3": 277.392, "r_y3": 694.204, "coord_origin": "TOPLEFT"}, "text": "Ji-", "orig": "Ji-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 150, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 712.86, "r_x1": 116.719, "r_y1": 712.86, "r_x2": 116.719, "r_y2": 705.163, "r_x3": 70.031, "r_y3": 705.163, "coord_origin": "TOPLEFT"}, "text": "meno Yepes.", "orig": "meno Yepes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 151, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 122.413, "r_y0": 712.86, "r_x1": 235.013, "r_y1": 712.86, "r_x2": 235.013, "r_y2": 705.163, "r_x3": 122.413, "r_y3": 705.163, "coord_origin": "TOPLEFT"}, "text": "Image-based table recognition:", "orig": "Image-based table recognition:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 152, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 239.335, "r_y0": 712.86, "r_x1": 286.363, "r_y1": 712.86, "r_x2": 286.363, "r_y2": 705.163, "r_x3": 239.335, "r_y3": 705.163, "coord_origin": "TOPLEFT"}, "text": "Data, model,", "orig": "Data, model,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 14, "label": "list_item", "bbox": {"l": 328.781, "t": 76.12599999999998, "r": 545.115, "b": 116.69899999999996, "coord_origin": "TOPLEFT"}, "confidence": 0.7556979060173035, "cells": [{"index": 153, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 83.82299999999998, "r_x1": 383.646, "r_y1": 83.82299999999998, "r_x2": 383.646, "r_y2": 76.12599999999998, "r_x3": 328.781, "r_y3": 76.12599999999998, "coord_origin": "TOPLEFT"}, "text": "and evaluation.", "orig": "and evaluation.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 154, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 388.56, "r_y0": 83.82299999999998, "r_x1": 545.113, "r_y1": 83.82299999999998, "r_x2": 545.113, "r_y2": 76.12599999999998, "r_x3": 388.56, "r_y3": 76.12599999999998, "coord_origin": "TOPLEFT"}, "text": "In Andrea Vedaldi, Horst Bischof, Thomas", "orig": "In Andrea Vedaldi, Horst Bischof, Thomas", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 155, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 94.78099999999995, "r_x1": 472.306, "r_y1": 94.78099999999995, "r_x2": 472.306, "r_y2": 87.08399999999995, "r_x3": 328.781, "r_y3": 87.08399999999995, "coord_origin": "TOPLEFT"}, "text": "Brox, and Jan-Michael Frahm, editors,", "orig": "Brox, and Jan-Michael Frahm, editors,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 156, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 475.885, "r_y0": 94.65200000000004, "r_x1": 545.115, "r_y1": 94.65200000000004, "r_x2": 545.115, "r_y2": 86.92200000000003, "r_x3": 475.885, "r_y3": 86.92200000000003, "coord_origin": "TOPLEFT"}, "text": "Computer Vision -", "orig": "Computer Vision -", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 157, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 105.61099999999999, "r_x1": 371.927, "r_y1": 105.61099999999999, "r_x2": 371.927, "r_y2": 97.88099999999997, "r_x3": 328.781, "r_y3": 97.88099999999997, "coord_origin": "TOPLEFT"}, "text": "ECCV 2020", "orig": "ECCV 2020", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 158, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 371.926, "r_y0": 105.74000000000001, "r_x1": 374.168, "r_y1": 105.74000000000001, "r_x2": 374.168, "r_y2": 98.043, "r_x3": 371.926, "r_y3": 98.043, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 159, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 376.472, "r_y0": 105.74000000000001, "r_x1": 545.112, "r_y1": 105.74000000000001, "r_x2": 545.112, "r_y2": 98.043, "r_x3": 376.472, "r_y3": 98.043, "coord_origin": "TOPLEFT"}, "text": "pages 564-580, Cham, 2020. Springer Interna-", "orig": "pages 564-580, Cham, 2020. Springer Interna-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 160, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 116.69899999999996, "r_x1": 417.701, "r_y1": 116.69899999999996, "r_x2": 417.701, "r_y2": 109.00199999999995, "r_x3": 328.781, "r_y3": 109.00199999999995, "coord_origin": "TOPLEFT"}, "text": "tional Publishing. 2, 3, 7", "orig": "tional Publishing. 2, 3, 7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 9, "label": "list_item", "bbox": {"l": 308.862, "t": 120.957, "r": 545.113, "b": 161.53099999999995, "coord_origin": "TOPLEFT"}, "confidence": 0.8375797271728516, "cells": [{"index": 161, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 128.654, "r_x1": 323.8, "r_y1": 128.654, "r_x2": 323.8, "r_y2": 120.957, "r_x3": 308.862, "r_y3": 120.957, "coord_origin": "TOPLEFT"}, "text": "[38]", "orig": "[38]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 162, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.785, "r_y0": 128.654, "r_x1": 523.15, "r_y1": 128.654, "r_x2": 523.15, "r_y2": 120.957, "r_x3": 328.785, "r_y3": 120.957, "coord_origin": "TOPLEFT"}, "text": "Xu Zhong, Jianbin Tang, and Antonio Jimeno Yepes.", "orig": "Xu Zhong, Jianbin Tang, and Antonio Jimeno Yepes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 163, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 528.171, "r_y0": 128.654, "r_x1": 545.109, "r_y1": 128.654, "r_x2": 545.109, "r_y2": 120.957, "r_x3": 528.171, "r_y3": 120.957, "coord_origin": "TOPLEFT"}, "text": "Pub-", "orig": "Pub-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 164, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 139.61300000000006, "r_x1": 545.113, "r_y1": 139.61300000000006, "r_x2": 545.113, "r_y2": 131.91600000000005, "r_x3": 328.781, "r_y3": 131.91600000000005, "coord_origin": "TOPLEFT"}, "text": "laynet: Largest dataset ever for document layout analysis. In", "orig": "laynet: Largest dataset ever for document layout analysis. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 165, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 150.44299999999998, "r_x1": 545.113, "r_y1": 150.44299999999998, "r_x2": 545.113, "r_y2": 142.71299999999997, "r_x3": 328.781, "r_y3": 142.71299999999997, "coord_origin": "TOPLEFT"}, "text": "2019 International Conference on Document Analysis and", "orig": "2019 International Conference on Document Analysis and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 166, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 161.40200000000004, "r_x1": 406.322, "r_y1": 161.40200000000004, "r_x2": 406.322, "r_y2": 153.67200000000003, "r_x3": 328.781, "r_y3": 153.67200000000003, "coord_origin": "TOPLEFT"}, "text": "Recognition (ICDAR)", "orig": "Recognition (ICDAR)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 167, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 406.322, "r_y0": 161.53099999999995, "r_x1": 506.181, "r_y1": 161.53099999999995, "r_x2": 506.181, "r_y2": 153.83399999999995, "r_x3": 406.322, "r_y3": 153.83399999999995, "coord_origin": "TOPLEFT"}, "text": ", pages 1015-1022, 2019. 1", "orig": ", pages 1015-1022, 2019. 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 0, "label": "page_footer", "bbox": {"l": 292.63, "t": 734.402, "r": 302.593, "b": 742.954, "coord_origin": "TOPLEFT"}, "confidence": 0.9069584012031555, "cells": [{"index": 168, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 292.63, "r_y0": 742.954, "r_x1": 302.593, "r_y1": 742.954, "r_x2": 302.593, "r_y2": 734.402, "r_x3": 292.63, "r_y3": 734.402, "coord_origin": "TOPLEFT"}, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}]}, "tablestructure": {"table_map": {}}, "figures_classification": null, "equations_prediction": null, "vlm_response": null}, "assembled": {"elements": [{"label": "text", "id": 15, "page_no": 9, "cluster": {"id": 15, "label": "text", "bbox": {"l": 70.031, "t": 75.96400000000006, "r": 286.362, "b": 94.78200000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.6886764168739319, "cells": [{"index": 0, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 83.69399999999996, "r_x1": 223.581, "r_y1": 83.69399999999996, "r_x2": 223.581, "r_y2": 75.96400000000006, "r_x3": 70.031, "r_y3": 75.96400000000006, "coord_origin": "TOPLEFT"}, "text": "Computer Vision and Pattern Recognition", "orig": "Computer Vision and Pattern Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 223.579, "r_y0": 83.82299999999998, "r_x1": 225.821, "r_y1": 83.82299999999998, "r_x2": 225.821, "r_y2": 76.12599999999998, "r_x3": 223.579, "r_y3": 76.12599999999998, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 229.183, "r_y0": 83.82299999999998, "r_x1": 286.362, "r_y1": 83.82299999999998, "r_x2": 286.362, "r_y2": 76.12599999999998, "r_x3": 229.183, "r_y3": 76.12599999999998, "coord_origin": "TOPLEFT"}, "text": "pages 658-666,", "orig": "pages 658-666,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 94.78200000000004, "r_x1": 97.917, "r_y1": 94.78200000000004, "r_x2": 97.917, "r_y2": 87.08500000000004, "r_x3": 70.031, "r_y3": 87.08500000000004, "coord_origin": "TOPLEFT"}, "text": "2019. 6", "orig": "2019. 6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Computer Vision and Pattern Recognition , pages 658-666, 2019. 6"}, {"label": "list_item", "id": 13, "page_no": 9, "cluster": {"id": 13, "label": "list_item", "bbox": {"l": 50.112, "t": 98.40800000000002, "r": 286.366, "b": 160.89999999999998, "coord_origin": "TOPLEFT"}, "confidence": 0.7723011374473572, "cells": [{"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 106.10500000000002, "r_x1": 65.05, "r_y1": 106.10500000000002, "r_x2": 65.05, "r_y2": 98.40800000000002, "r_x3": 50.112, "r_y3": 98.40800000000002, "coord_origin": "TOPLEFT"}, "text": "[26]", "orig": "[26]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 106.10500000000002, "r_x1": 286.359, "r_y1": 106.10500000000002, "r_x2": 286.359, "r_y2": 98.40800000000002, "r_x3": 70.035, "r_y3": 98.40800000000002, "coord_origin": "TOPLEFT"}, "text": "Sebastian Schreiber, Stefan Agne, Ivo Wolf, Andreas Den-", "orig": "Sebastian Schreiber, Stefan Agne, Ivo Wolf, Andreas Den-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 117.06399999999996, "r_x1": 286.363, "r_y1": 117.06399999999996, "r_x2": 286.363, "r_y2": 109.36699999999996, "r_x3": 70.031, "r_y3": 109.36699999999996, "coord_origin": "TOPLEFT"}, "text": "gel, and Sheraz Ahmed. Deepdesrt: Deep learning for detec-", "orig": "gel, and Sheraz Ahmed. Deepdesrt: Deep learning for detec-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 128.02300000000002, "r_x1": 286.363, "r_y1": 128.02300000000002, "r_x2": 286.363, "r_y2": 120.32600000000002, "r_x3": 70.031, "r_y3": 120.32600000000002, "coord_origin": "TOPLEFT"}, "text": "tion and structure recognition of tables in document images.", "orig": "tion and structure recognition of tables in document images.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 138.98199999999997, "r_x1": 77.5, "r_y1": 138.98199999999997, "r_x2": 77.5, "r_y2": 131.28499999999997, "r_x3": 70.031, "r_y3": 131.28499999999997, "coord_origin": "TOPLEFT"}, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 80.56, "r_y0": 138.85299999999995, "r_x1": 286.366, "r_y1": 138.85299999999995, "r_x2": 286.366, "r_y2": 131.12300000000005, "r_x3": 80.56, "r_y3": 131.12300000000005, "coord_origin": "TOPLEFT"}, "text": "2017 14th IAPR International Conference on Document", "orig": "2017 14th IAPR International Conference on Document", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 149.812, "r_x1": 195.229, "r_y1": 149.812, "r_x2": 195.229, "r_y2": 142.082, "r_x3": 70.031, "r_y3": 142.082, "coord_origin": "TOPLEFT"}, "text": "Analysis and Recognition (ICDAR)", "orig": "Analysis and Recognition (ICDAR)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 195.231, "r_y0": 149.94100000000003, "r_x1": 286.365, "r_y1": 149.94100000000003, "r_x2": 286.365, "r_y2": 142.24400000000003, "r_x3": 195.231, "r_y3": 142.24400000000003, "coord_origin": "TOPLEFT"}, "text": ", volume 01, pages 1162-", "orig": ", volume 01, pages 1162-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 160.89999999999998, "r_x1": 120.333, "r_y1": 160.89999999999998, "r_x2": 120.333, "r_y2": 153.20299999999997, "r_x3": 70.031, "r_y3": 153.20299999999997, "coord_origin": "TOPLEFT"}, "text": "1167, 2017. 1", "orig": "1167, 2017. 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[26] Sebastian Schreiber, Stefan Agne, Ivo Wolf, Andreas Dengel, and Sheraz Ahmed. Deepdesrt: Deep learning for detection and structure recognition of tables in document images. In 2017 14th IAPR International Conference on Document Analysis and Recognition (ICDAR) , volume 01, pages 11621167, 2017. 1"}, {"label": "list_item", "id": 2, "page_no": 9, "cluster": {"id": 2, "label": "list_item", "bbox": {"l": 50.112, "t": 164.52700000000004, "r": 286.363, "b": 227.01800000000003, "coord_origin": "TOPLEFT"}, "confidence": 0.8580600619316101, "cells": [{"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 172.22400000000005, "r_x1": 65.05, "r_y1": 172.22400000000005, "r_x2": 65.05, "r_y2": 164.52700000000004, "r_x3": 50.112, "r_y3": 164.52700000000004, "coord_origin": "TOPLEFT"}, "text": "[27]", "orig": "[27]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 172.22400000000005, "r_x1": 286.359, "r_y1": 172.22400000000005, "r_x2": 286.359, "r_y2": 164.52700000000004, "r_x3": 70.035, "r_y3": 164.52700000000004, "coord_origin": "TOPLEFT"}, "text": "Sebastian Schreiber, Stefan Agne, Ivo Wolf, Andreas Den-", "orig": "Sebastian Schreiber, Stefan Agne, Ivo Wolf, Andreas Den-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 183.183, "r_x1": 158.395, "r_y1": 183.183, "r_x2": 158.395, "r_y2": 175.486, "r_x3": 70.031, "r_y3": 175.486, "coord_origin": "TOPLEFT"}, "text": "gel, and Sheraz Ahmed.", "orig": "gel, and Sheraz Ahmed.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 164.035, "r_y0": 183.183, "r_x1": 202.877, "r_y1": 183.183, "r_x2": 202.877, "r_y2": 175.486, "r_x3": 164.035, "r_y3": 175.486, "coord_origin": "TOPLEFT"}, "text": "Deepdesrt:", "orig": "Deepdesrt:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 207.163, "r_y0": 183.183, "r_x1": 286.363, "r_y1": 183.183, "r_x2": 286.363, "r_y2": 175.486, "r_x3": 207.163, "r_y3": 175.486, "coord_origin": "TOPLEFT"}, "text": "Deep learning for de-", "orig": "Deep learning for de-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 194.14200000000005, "r_x1": 286.363, "r_y1": 194.14200000000005, "r_x2": 286.363, "r_y2": 186.44500000000005, "r_x3": 70.031, "r_y3": 186.44500000000005, "coord_origin": "TOPLEFT"}, "text": "tection and structure recognition of tables in document im-", "orig": "tection and structure recognition of tables in document im-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 19, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 205.101, "r_x1": 88.206, "r_y1": 205.101, "r_x2": 88.206, "r_y2": 197.404, "r_x3": 70.031, "r_y3": 197.404, "coord_origin": "TOPLEFT"}, "text": "ages.", "orig": "ages.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 20, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 93.864, "r_y0": 205.101, "r_x1": 101.333, "r_y1": 205.101, "r_x2": 101.333, "r_y2": 197.404, "r_x3": 93.864, "r_y3": 197.404, "coord_origin": "TOPLEFT"}, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 21, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 104.331, "r_y0": 204.97199999999998, "r_x1": 286.358, "r_y1": 204.97199999999998, "r_x2": 286.358, "r_y2": 197.24199999999996, "r_x3": 104.331, "r_y3": 197.24199999999996, "coord_origin": "TOPLEFT"}, "text": "2017 14th IAPR international conference on doc-", "orig": "2017 14th IAPR international conference on doc-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 22, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 215.92999999999995, "r_x1": 220.487, "r_y1": 215.92999999999995, "r_x2": 220.487, "r_y2": 208.20000000000005, "r_x3": 70.031, "r_y3": 208.20000000000005, "coord_origin": "TOPLEFT"}, "text": "ument analysis and recognition (ICDAR)", "orig": "ument analysis and recognition (ICDAR)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 23, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 220.484, "r_y0": 216.05899999999997, "r_x1": 222.726, "r_y1": 216.05899999999997, "r_x2": 222.726, "r_y2": 208.36199999999997, "r_x3": 220.484, "r_y3": 208.36199999999997, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 24, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 225.909, "r_y0": 216.05899999999997, "r_x1": 286.36, "r_y1": 216.05899999999997, "r_x2": 286.36, "r_y2": 208.36199999999997, "r_x3": 225.909, "r_y3": 208.36199999999997, "coord_origin": "TOPLEFT"}, "text": "volume 1, pages", "orig": "volume 1, pages", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 25, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 227.01800000000003, "r_x1": 166.653, "r_y1": 227.01800000000003, "r_x2": 166.653, "r_y2": 219.32100000000003, "r_x3": 70.031, "r_y3": 219.32100000000003, "coord_origin": "TOPLEFT"}, "text": "1162-1167. IEEE, 2017. 3", "orig": "1162-1167. IEEE, 2017. 3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[27] Sebastian Schreiber, Stefan Agne, Ivo Wolf, Andreas Dengel, and Sheraz Ahmed. Deepdesrt: Deep learning for detection and structure recognition of tables in document images. In 2017 14th IAPR international conference on document analysis and recognition (ICDAR) , volume 1, pages 1162-1167. IEEE, 2017. 3"}, {"label": "list_item", "id": 4, "page_no": 9, "cluster": {"id": 4, "label": "list_item", "bbox": {"l": 50.112, "t": 230.64499999999998, "r": 286.366, "b": 271.21900000000005, "coord_origin": "TOPLEFT"}, "confidence": 0.8512731194496155, "cells": [{"index": 26, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 238.34199999999998, "r_x1": 65.05, "r_y1": 238.34199999999998, "r_x2": 65.05, "r_y2": 230.64499999999998, "r_x3": 50.112, "r_y3": 230.64499999999998, "coord_origin": "TOPLEFT"}, "text": "[28]", "orig": "[28]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 27, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 238.34199999999998, "r_x1": 179.147, "r_y1": 238.34199999999998, "r_x2": 179.147, "r_y2": 230.64499999999998, "r_x3": 70.035, "r_y3": 230.64499999999998, "coord_origin": "TOPLEFT"}, "text": "Faisal Shafait and Ray Smith.", "orig": "Faisal Shafait and Ray Smith.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 28, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 184.366, "r_y0": 238.34199999999998, "r_x1": 286.359, "r_y1": 238.34199999999998, "r_x2": 286.359, "r_y2": 230.64499999999998, "r_x3": 184.366, "r_y3": 230.64499999999998, "coord_origin": "TOPLEFT"}, "text": "Table detection in heteroge-", "orig": "Table detection in heteroge-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 29, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 249.30100000000004, "r_x1": 134.804, "r_y1": 249.30100000000004, "r_x2": 134.804, "r_y2": 241.60400000000004, "r_x3": 70.031, "r_y3": 241.60400000000004, "coord_origin": "TOPLEFT"}, "text": "neous documents.", "orig": "neous documents.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 30, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 139.7, "r_y0": 249.30100000000004, "r_x1": 147.169, "r_y1": 249.30100000000004, "r_x2": 147.169, "r_y2": 241.60400000000004, "r_x3": 139.7, "r_y3": 241.60400000000004, "coord_origin": "TOPLEFT"}, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 149.933, "r_y0": 249.17200000000003, "r_x1": 286.366, "r_y1": 249.17200000000003, "r_x2": 286.366, "r_y2": 241.442, "r_x3": 149.933, "r_y3": 241.442, "coord_origin": "TOPLEFT"}, "text": "Proceedings of the 9th IAPR Interna-", "orig": "Proceedings of the 9th IAPR Interna-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 260.131, "r_x1": 244.688, "r_y1": 260.131, "r_x2": 244.688, "r_y2": 252.40099999999995, "r_x3": 70.031, "r_y3": 252.40099999999995, "coord_origin": "TOPLEFT"}, "text": "tional Workshop on Document Analysis Systems", "orig": "tional Workshop on Document Analysis Systems", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 244.691, "r_y0": 260.26, "r_x1": 246.933, "r_y1": 260.26, "r_x2": 246.933, "r_y2": 252.563, "r_x3": 244.691, "r_y3": 252.563, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 249.775, "r_y0": 260.26, "r_x1": 286.358, "r_y1": 260.26, "r_x2": 286.358, "r_y2": 252.563, "r_x3": 249.775, "r_y3": 252.563, "coord_origin": "TOPLEFT"}, "text": "pages 65-", "orig": "pages 65-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 271.21900000000005, "r_x1": 111.366, "r_y1": 271.21900000000005, "r_x2": 111.366, "r_y2": 263.52200000000005, "r_x3": 70.031, "r_y3": 263.52200000000005, "coord_origin": "TOPLEFT"}, "text": "72, 2010. 2", "orig": "72, 2010. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[28] Faisal Shafait and Ray Smith. Table detection in heterogeneous documents. In Proceedings of the 9th IAPR International Workshop on Document Analysis Systems , pages 6572, 2010. 2"}, {"label": "list_item", "id": 5, "page_no": 9, "cluster": {"id": 5, "label": "list_item", "bbox": {"l": 50.112, "t": 274.846, "r": 286.366, "b": 326.378, "coord_origin": "TOPLEFT"}, "confidence": 0.8494512438774109, "cells": [{"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 282.543, "r_x1": 65.05, "r_y1": 282.543, "r_x2": 65.05, "r_y2": 274.846, "r_x3": 50.112, "r_y3": 274.846, "coord_origin": "TOPLEFT"}, "text": "[29]", "orig": "[29]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 282.543, "r_x1": 94.944, "r_y1": 282.543, "r_x2": 94.944, "r_y2": 274.846, "r_x3": 70.035, "r_y3": 274.846, "coord_origin": "TOPLEFT"}, "text": "Shoaib", "orig": "Shoaib", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 100.871, "r_y0": 282.543, "r_x1": 127.268, "r_y1": 282.543, "r_x2": 127.268, "r_y2": 274.846, "r_x3": 100.871, "r_y3": 274.846, "coord_origin": "TOPLEFT"}, "text": "Ahmed", "orig": "Ahmed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 133.195, "r_y0": 282.543, "r_x1": 165.832, "r_y1": 282.543, "r_x2": 165.832, "r_y2": 274.846, "r_x3": 133.195, "r_y3": 274.846, "coord_origin": "TOPLEFT"}, "text": "Siddiqui,", "orig": "Siddiqui,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 172.683, "r_y0": 282.543, "r_x1": 194.094, "r_y1": 282.543, "r_x2": 194.094, "r_y2": 274.846, "r_x3": 172.683, "r_y3": 274.846, "coord_origin": "TOPLEFT"}, "text": "Imran", "orig": "Imran", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 200.021, "r_y0": 282.543, "r_x1": 211.48, "r_y1": 282.543, "r_x2": 211.48, "r_y2": 274.846, "r_x3": 200.021, "r_y3": 274.846, "coord_origin": "TOPLEFT"}, "text": "Ali", "orig": "Ali", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 217.407, "r_y0": 282.543, "r_x1": 239.438, "r_y1": 282.543, "r_x2": 239.438, "r_y2": 274.846, "r_x3": 217.407, "r_y3": 274.846, "coord_origin": "TOPLEFT"}, "text": "Fateh,", "orig": "Fateh,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 246.288, "r_y0": 282.543, "r_x1": 264.221, "r_y1": 282.543, "r_x2": 264.221, "r_y2": 274.846, "r_x3": 246.288, "r_y3": 274.846, "coord_origin": "TOPLEFT"}, "text": "Syed", "orig": "Syed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 270.147, "r_y0": 282.543, "r_x1": 286.359, "r_y1": 282.543, "r_x2": 286.359, "r_y2": 274.846, "r_x3": 270.147, "r_y3": 274.846, "coord_origin": "TOPLEFT"}, "text": "Tah-", "orig": "Tah-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 293.502, "r_x1": 85.964, "r_y1": 293.502, "r_x2": 85.964, "r_y2": 285.805, "r_x3": 70.031, "r_y3": 285.805, "coord_origin": "TOPLEFT"}, "text": "seen", "orig": "seen", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 91.021, "r_y0": 293.502, "r_x1": 108.945, "r_y1": 293.502, "r_x2": 108.945, "r_y2": 285.805, "r_x3": 91.021, "r_y3": 285.805, "coord_origin": "TOPLEFT"}, "text": "Raza", "orig": "Raza", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 114.002, "r_y0": 293.502, "r_x1": 135.674, "r_y1": 293.502, "r_x2": 135.674, "r_y2": 285.805, "r_x3": 114.002, "r_y3": 285.805, "coord_origin": "TOPLEFT"}, "text": "Rizvi,", "orig": "Rizvi,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 48, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 141.43, "r_y0": 293.502, "r_x1": 171.306, "r_y1": 293.502, "r_x2": 171.306, "r_y2": 285.805, "r_x3": 141.43, "r_y3": 285.805, "coord_origin": "TOPLEFT"}, "text": "Andreas", "orig": "Andreas", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 49, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 176.364, "r_y0": 293.502, "r_x1": 204.5, "r_y1": 293.502, "r_x2": 204.5, "r_y2": 285.805, "r_x3": 176.364, "r_y3": 285.805, "coord_origin": "TOPLEFT"}, "text": "Dengel,", "orig": "Dengel,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 50, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 210.265, "r_y0": 293.502, "r_x1": 223.213, "r_y1": 293.502, "r_x2": 223.213, "r_y2": 285.805, "r_x3": 210.265, "r_y3": 285.805, "coord_origin": "TOPLEFT"}, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 51, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 228.27, "r_y0": 293.502, "r_x1": 252.668, "r_y1": 293.502, "r_x2": 252.668, "r_y2": 285.805, "r_x3": 228.27, "r_y3": 285.805, "coord_origin": "TOPLEFT"}, "text": "Sheraz", "orig": "Sheraz", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 52, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 257.725, "r_y0": 293.502, "r_x1": 286.363, "r_y1": 293.502, "r_x2": 286.363, "r_y2": 285.805, "r_x3": 257.725, "r_y3": 285.805, "coord_origin": "TOPLEFT"}, "text": "Ahmed.", "orig": "Ahmed.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 53, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 304.461, "r_x1": 286.363, "r_y1": 304.461, "r_x2": 286.363, "r_y2": 296.764, "r_x3": 70.031, "r_y3": 296.764, "coord_origin": "TOPLEFT"}, "text": "Deeptabstr: Deep learning based table structure recognition.", "orig": "Deeptabstr: Deep learning based table structure recognition.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 54, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 315.42, "r_x1": 77.5, "r_y1": 315.42, "r_x2": 77.5, "r_y2": 307.723, "r_x3": 70.031, "r_y3": 307.723, "coord_origin": "TOPLEFT"}, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 55, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 79.35, "r_y0": 315.291, "r_x1": 286.366, "r_y1": 315.291, "r_x2": 286.366, "r_y2": 307.561, "r_x3": 79.35, "r_y3": 307.561, "coord_origin": "TOPLEFT"}, "text": "2019 International Conference on Document Analysis and", "orig": "2019 International Conference on Document Analysis and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 56, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 326.249, "r_x1": 147.572, "r_y1": 326.249, "r_x2": 147.572, "r_y2": 318.519, "r_x3": 70.031, "r_y3": 318.519, "coord_origin": "TOPLEFT"}, "text": "Recognition (ICDAR)", "orig": "Recognition (ICDAR)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 57, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 147.572, "r_y0": 326.378, "r_x1": 271.335, "r_y1": 326.378, "r_x2": 271.335, "r_y2": 318.681, "r_x3": 147.572, "r_y3": 318.681, "coord_origin": "TOPLEFT"}, "text": ", pages 1403-1409. IEEE, 2019. 3", "orig": ", pages 1403-1409. IEEE, 2019. 3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[29] Shoaib Ahmed Siddiqui, Imran Ali Fateh, Syed Tahseen Raza Rizvi, Andreas Dengel, and Sheraz Ahmed. Deeptabstr: Deep learning based table structure recognition. In 2019 International Conference on Document Analysis and Recognition (ICDAR) , pages 1403-1409. IEEE, 2019. 3"}, {"label": "list_item", "id": 3, "page_no": 9, "cluster": {"id": 3, "label": "list_item", "bbox": {"l": 50.112, "t": 330.005, "r": 286.363, "b": 381.538, "coord_origin": "TOPLEFT"}, "confidence": 0.8567671179771423, "cells": [{"index": 58, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 337.702, "r_x1": 65.05, "r_y1": 337.702, "r_x2": 65.05, "r_y2": 330.005, "r_x3": 50.112, "r_y3": 330.005, "coord_origin": "TOPLEFT"}, "text": "[30]", "orig": "[30]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 59, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 337.702, "r_x1": 286.359, "r_y1": 337.702, "r_x2": 286.359, "r_y2": 330.005, "r_x3": 70.035, "r_y3": 330.005, "coord_origin": "TOPLEFT"}, "text": "Peter WJ Staar, Michele Dolfi, Christoph Auer, and Costas", "orig": "Peter WJ Staar, Michele Dolfi, Christoph Auer, and Costas", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 60, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 348.661, "r_x1": 286.363, "r_y1": 348.661, "r_x2": 286.363, "r_y2": 340.964, "r_x3": 70.031, "r_y3": 340.964, "coord_origin": "TOPLEFT"}, "text": "Bekas. Corpus conversion service: A machine learning plat-", "orig": "Bekas. Corpus conversion service: A machine learning plat-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 61, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 359.62, "r_x1": 198.824, "r_y1": 359.62, "r_x2": 198.824, "r_y2": 351.923, "r_x3": 70.031, "r_y3": 351.923, "coord_origin": "TOPLEFT"}, "text": "form to ingest documents at scale.", "orig": "form to ingest documents at scale.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 62, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 206.06, "r_y0": 359.62, "r_x1": 213.529, "r_y1": 359.62, "r_x2": 213.529, "r_y2": 351.923, "r_x3": 206.06, "r_y3": 351.923, "coord_origin": "TOPLEFT"}, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 63, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 217.021, "r_y0": 359.491, "r_x1": 286.358, "r_y1": 359.491, "r_x2": 286.358, "r_y2": 351.761, "r_x3": 217.021, "r_y3": 351.761, "coord_origin": "TOPLEFT"}, "text": "Proceedings of the", "orig": "Proceedings of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 64, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 370.45, "r_x1": 143.08, "r_y1": 370.45, "r_x2": 143.08, "r_y2": 362.72, "r_x3": 70.031, "r_y3": 362.72, "coord_origin": "TOPLEFT"}, "text": "24th ACM SIGKDD", "orig": "24th ACM SIGKDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 65, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 143.078, "r_y0": 370.579, "r_x1": 145.32, "r_y1": 370.579, "r_x2": 145.32, "r_y2": 362.882, "r_x3": 143.078, "r_y3": 362.882, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 66, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 148.108, "r_y0": 370.579, "r_x1": 286.361, "r_y1": 370.579, "r_x2": 286.361, "r_y2": 362.882, "r_x3": 148.108, "r_y3": 362.882, "coord_origin": "TOPLEFT"}, "text": "KDD '18, pages 774-782, New York,", "orig": "KDD '18, pages 774-782, New York,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 67, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 381.538, "r_x1": 161.157, "r_y1": 381.538, "r_x2": 161.157, "r_y2": 373.841, "r_x3": 70.031, "r_y3": 373.841, "coord_origin": "TOPLEFT"}, "text": "NY, USA, 2018. ACM. 1", "orig": "NY, USA, 2018. ACM. 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[30] Peter WJ Staar, Michele Dolfi, Christoph Auer, and Costas Bekas. Corpus conversion service: A machine learning platform to ingest documents at scale. In Proceedings of the 24th ACM SIGKDD , KDD '18, pages 774-782, New York, NY, USA, 2018. ACM. 1"}, {"label": "list_item", "id": 1, "page_no": 9, "cluster": {"id": 1, "label": "list_item", "bbox": {"l": 50.112, "t": 385.165, "r": 286.364, "b": 458.615, "coord_origin": "TOPLEFT"}, "confidence": 0.8832162618637085, "cells": [{"index": 68, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 392.862, "r_x1": 65.05, "r_y1": 392.862, "r_x2": 65.05, "r_y2": 385.165, "r_x3": 50.112, "r_y3": 385.165, "coord_origin": "TOPLEFT"}, "text": "[31]", "orig": "[31]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 69, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 392.862, "r_x1": 286.359, "r_y1": 392.862, "r_x2": 286.359, "r_y2": 385.165, "r_x3": 70.035, "r_y3": 385.165, "coord_origin": "TOPLEFT"}, "text": "Ashish Vaswani, Noam Shazeer, Niki Parmar, Jakob Uszko-", "orig": "Ashish Vaswani, Noam Shazeer, Niki Parmar, Jakob Uszko-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 70, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 403.821, "r_x1": 84.225, "r_y1": 403.821, "r_x2": 84.225, "r_y2": 396.124, "r_x3": 70.031, "r_y3": 396.124, "coord_origin": "TOPLEFT"}, "text": "reit,", "orig": "reit,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 71, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 87.489, "r_y0": 403.821, "r_x1": 286.363, "r_y1": 403.821, "r_x2": 286.363, "r_y2": 396.124, "r_x3": 87.489, "r_y3": 396.124, "coord_origin": "TOPLEFT"}, "text": "Llion Jones, Aidan N Gomez, \u0141 ukasz Kaiser, and Il-", "orig": "Llion Jones, Aidan N Gomez, \u0141 ukasz Kaiser, and Il-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 72, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 414.78, "r_x1": 78.997, "r_y1": 414.78, "r_x2": 78.997, "r_y2": 407.083, "r_x3": 70.031, "r_y3": 407.083, "coord_origin": "TOPLEFT"}, "text": "lia", "orig": "lia", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 73, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 82.871, "r_y0": 414.78, "r_x1": 125.47, "r_y1": 414.78, "r_x2": 125.47, "r_y2": 407.083, "r_x3": 82.871, "r_y3": 407.083, "coord_origin": "TOPLEFT"}, "text": "Polosukhin.", "orig": "Polosukhin.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 74, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 133.908, "r_y0": 414.78, "r_x1": 167.783, "r_y1": 414.78, "r_x2": 167.783, "r_y2": 407.083, "r_x3": 133.908, "r_y3": 407.083, "coord_origin": "TOPLEFT"}, "text": "Attention", "orig": "Attention", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 75, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 171.656, "r_y0": 414.78, "r_x1": 177.637, "r_y1": 414.78, "r_x2": 177.637, "r_y2": 407.083, "r_x3": 171.656, "r_y3": 407.083, "coord_origin": "TOPLEFT"}, "text": "is", "orig": "is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 76, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 181.51, "r_y0": 414.78, "r_x1": 190.477, "r_y1": 414.78, "r_x2": 190.477, "r_y2": 407.083, "r_x3": 181.51, "r_y3": 407.083, "coord_origin": "TOPLEFT"}, "text": "all", "orig": "all", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 77, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 194.341, "r_y0": 414.78, "r_x1": 230.834, "r_y1": 414.78, "r_x2": 230.834, "r_y2": 407.083, "r_x3": 194.341, "r_y3": 407.083, "coord_origin": "TOPLEFT"}, "text": "you need.", "orig": "you need.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 78, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 239.272, "r_y0": 414.78, "r_x1": 246.741, "r_y1": 414.78, "r_x2": 246.741, "r_y2": 407.083, "r_x3": 239.272, "r_y3": 407.083, "coord_origin": "TOPLEFT"}, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 79, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 250.614, "r_y0": 414.78, "r_x1": 255.842, "r_y1": 414.78, "r_x2": 255.842, "r_y2": 407.083, "r_x3": 250.614, "r_y3": 407.083, "coord_origin": "TOPLEFT"}, "text": "I.", "orig": "I.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 80, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 259.715, "r_y0": 414.78, "r_x1": 286.363, "r_y1": 414.78, "r_x2": 286.363, "r_y2": 407.083, "r_x3": 259.715, "r_y3": 407.083, "coord_origin": "TOPLEFT"}, "text": "Guyon,", "orig": "Guyon,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 81, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 425.739, "r_x1": 286.363, "r_y1": 425.739, "r_x2": 286.363, "r_y2": 418.042, "r_x3": 70.031, "r_y3": 418.042, "coord_origin": "TOPLEFT"}, "text": "U. V. Luxburg, S. Bengio, H. Wallach, R. Fergus, S. Vish-", "orig": "U. V. Luxburg, S. Bengio, H. Wallach, R. Fergus, S. Vish-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 82, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 436.697, "r_x1": 196.762, "r_y1": 436.697, "r_x2": 196.762, "r_y2": 429.0, "r_x3": 70.031, "r_y3": 429.0, "coord_origin": "TOPLEFT"}, "text": "wanathan, and R. Garnett, editors,", "orig": "wanathan, and R. Garnett, editors,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 83, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 200.202, "r_y0": 436.568, "r_x1": 286.36, "r_y1": 436.568, "r_x2": 286.36, "r_y2": 428.838, "r_x3": 200.202, "r_y3": 428.838, "coord_origin": "TOPLEFT"}, "text": "Advances in Neural In-", "orig": "Advances in Neural In-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 84, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 447.527, "r_x1": 189.194, "r_y1": 447.527, "r_x2": 189.194, "r_y2": 439.797, "r_x3": 70.031, "r_y3": 439.797, "coord_origin": "TOPLEFT"}, "text": "formation Processing Systems 30", "orig": "formation Processing Systems 30", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 85, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 189.195, "r_y0": 447.656, "r_x1": 191.437, "r_y1": 447.656, "r_x2": 191.437, "r_y2": 439.959, "r_x3": 189.195, "r_y3": 439.959, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 86, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 193.795, "r_y0": 447.656, "r_x1": 286.364, "r_y1": 447.656, "r_x2": 286.364, "r_y2": 439.959, "r_x3": 193.795, "r_y3": 439.959, "coord_origin": "TOPLEFT"}, "text": "pages 5998-6008. Curran", "orig": "pages 5998-6008. Curran", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 87, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 458.615, "r_x1": 158.924, "r_y1": 458.615, "r_x2": 158.924, "r_y2": 450.918, "r_x3": 70.031, "r_y3": 450.918, "coord_origin": "TOPLEFT"}, "text": "Associates, Inc., 2017. 5", "orig": "Associates, Inc., 2017. 5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[31] Ashish Vaswani, Noam Shazeer, Niki Parmar, Jakob Uszkoreit, Llion Jones, Aidan N Gomez, \u0141 ukasz Kaiser, and Illia Polosukhin. Attention is all you need. In I. Guyon, U. V. Luxburg, S. Bengio, H. Wallach, R. Fergus, S. Vishwanathan, and R. Garnett, editors, Advances in Neural Information Processing Systems 30 , pages 5998-6008. Curran Associates, Inc., 2017. 5"}, {"label": "list_item", "id": 6, "page_no": 9, "cluster": {"id": 6, "label": "list_item", "bbox": {"l": 50.112, "t": 462.242, "r": 286.363, "b": 502.816, "coord_origin": "TOPLEFT"}, "confidence": 0.8431925177574158, "cells": [{"index": 88, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 469.939, "r_x1": 65.05, "r_y1": 469.939, "r_x2": 65.05, "r_y2": 462.242, "r_x3": 50.112, "r_y3": 462.242, "coord_origin": "TOPLEFT"}, "text": "[32]", "orig": "[32]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 89, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 469.939, "r_x1": 88.963, "r_y1": 469.939, "r_x2": 88.963, "r_y2": 462.242, "r_x3": 70.035, "r_y3": 462.242, "coord_origin": "TOPLEFT"}, "text": "Oriol", "orig": "Oriol", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 90, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 92.81, "r_y0": 469.939, "r_x1": 122.274, "r_y1": 469.939, "r_x2": 122.274, "r_y2": 462.242, "r_x3": 92.81, "r_y3": 462.242, "coord_origin": "TOPLEFT"}, "text": "Vinyals,", "orig": "Vinyals,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 91, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 126.524, "r_y0": 469.939, "r_x1": 194.695, "r_y1": 469.939, "r_x2": 194.695, "r_y2": 462.242, "r_x3": 126.524, "r_y3": 462.242, "coord_origin": "TOPLEFT"}, "text": "Alexander Toshev,", "orig": "Alexander Toshev,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 92, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 198.954, "r_y0": 469.939, "r_x1": 286.359, "r_y1": 469.939, "r_x2": 286.359, "r_y2": 462.242, "r_x3": 198.954, "r_y3": 462.242, "coord_origin": "TOPLEFT"}, "text": "Samy Bengio, and Du-", "orig": "Samy Bengio, and Du-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 93, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 480.898, "r_x1": 116.28, "r_y1": 480.898, "r_x2": 116.28, "r_y2": 473.201, "r_x3": 70.031, "r_y3": 473.201, "coord_origin": "TOPLEFT"}, "text": "mitru Erhan.", "orig": "mitru Erhan.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 94, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 122.484, "r_y0": 480.898, "r_x1": 175.924, "r_y1": 480.898, "r_x2": 175.924, "r_y2": 473.201, "r_x3": 122.484, "r_y3": 473.201, "coord_origin": "TOPLEFT"}, "text": "Show and tell:", "orig": "Show and tell:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 95, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 180.56, "r_y0": 480.898, "r_x1": 286.363, "r_y1": 480.898, "r_x2": 286.363, "r_y2": 473.201, "r_x3": 180.56, "r_y3": 473.201, "coord_origin": "TOPLEFT"}, "text": "A neural image caption gen-", "orig": "A neural image caption gen-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 96, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 491.857, "r_x1": 103.305, "r_y1": 491.857, "r_x2": 103.305, "r_y2": 484.16, "r_x3": 70.031, "r_y3": 484.16, "coord_origin": "TOPLEFT"}, "text": "erator. In", "orig": "erator. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 97, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 105.516, "r_y0": 491.728, "r_x1": 286.359, "r_y1": 491.728, "r_x2": 286.359, "r_y2": 483.998, "r_x3": 105.516, "r_y3": 483.998, "coord_origin": "TOPLEFT"}, "text": "Proceedings of the IEEE Conference on Computer", "orig": "Proceedings of the IEEE Conference on Computer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 98, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 502.687, "r_x1": 212.516, "r_y1": 502.687, "r_x2": 212.516, "r_y2": 494.957, "r_x3": 70.031, "r_y3": 494.957, "coord_origin": "TOPLEFT"}, "text": "Vision and Pattern Recognition (CVPR)", "orig": "Vision and Pattern Recognition (CVPR)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 99, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 212.514, "r_y0": 502.816, "r_x1": 263.56, "r_y1": 502.816, "r_x2": 263.56, "r_y2": 495.119, "r_x3": 212.514, "r_y3": 495.119, "coord_origin": "TOPLEFT"}, "text": ", June 2015. 2", "orig": ", June 2015. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[32] Oriol Vinyals, Alexander Toshev, Samy Bengio, and Dumitru Erhan. Show and tell: A neural image caption generator. In Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition (CVPR) , June 2015. 2"}, {"label": "list_item", "id": 7, "page_no": 9, "cluster": {"id": 7, "label": "list_item", "bbox": {"l": 50.112, "t": 506.443, "r": 286.363, "b": 547.016, "coord_origin": "TOPLEFT"}, "confidence": 0.8405635952949524, "cells": [{"index": 100, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 514.14, "r_x1": 65.05, "r_y1": 514.14, "r_x2": 65.05, "r_y2": 506.443, "r_x3": 50.112, "r_y3": 506.443, "coord_origin": "TOPLEFT"}, "text": "[33]", "orig": "[33]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 101, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 514.14, "r_x1": 247.373, "r_y1": 514.14, "r_x2": 247.373, "r_y2": 506.443, "r_x3": 70.035, "r_y3": 506.443, "coord_origin": "TOPLEFT"}, "text": "Wenyuan Xue, Qingyong Li, and Dacheng Tao.", "orig": "Wenyuan Xue, Qingyong Li, and Dacheng Tao.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 102, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 253.972, "r_y0": 514.14, "r_x1": 286.359, "r_y1": 514.14, "r_x2": 286.359, "r_y2": 506.443, "r_x3": 253.972, "r_y3": 506.443, "coord_origin": "TOPLEFT"}, "text": "Res2tim:", "orig": "Res2tim:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 103, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 525.0989999999999, "r_x1": 253.125, "r_y1": 525.0989999999999, "r_x2": 253.125, "r_y2": 517.402, "r_x3": 70.031, "r_y3": 517.402, "coord_origin": "TOPLEFT"}, "text": "reconstruct syntactic structures from table images.", "orig": "reconstruct syntactic structures from table images.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 104, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 258.155, "r_y0": 525.0989999999999, "r_x1": 265.624, "r_y1": 525.0989999999999, "r_x2": 265.624, "r_y2": 517.402, "r_x3": 258.155, "r_y3": 517.402, "coord_origin": "TOPLEFT"}, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 105, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 268.429, "r_y0": 524.97, "r_x1": 286.362, "r_y1": 524.97, "r_x2": 286.362, "r_y2": 517.24, "r_x3": 268.429, "r_y3": 517.24, "coord_origin": "TOPLEFT"}, "text": "2019", "orig": "2019", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 106, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 535.929, "r_x1": 286.363, "r_y1": 535.929, "r_x2": 286.363, "r_y2": 528.1990000000001, "r_x3": 70.031, "r_y3": 528.1990000000001, "coord_origin": "TOPLEFT"}, "text": "International Conference on Document Analysis and Recog-", "orig": "International Conference on Document Analysis and Recog-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 107, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 546.887, "r_x1": 125.255, "r_y1": 546.887, "r_x2": 125.255, "r_y2": 539.157, "r_x3": 70.031, "r_y3": 539.157, "coord_origin": "TOPLEFT"}, "text": "nition (ICDAR)", "orig": "nition (ICDAR)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 108, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 125.254, "r_y0": 547.016, "r_x1": 240.051, "r_y1": 547.016, "r_x2": 240.051, "r_y2": 539.319, "r_x3": 125.254, "r_y3": 539.319, "coord_origin": "TOPLEFT"}, "text": ", pages 749-755. IEEE, 2019. 3", "orig": ", pages 749-755. IEEE, 2019. 3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[33] Wenyuan Xue, Qingyong Li, and Dacheng Tao. Res2tim: reconstruct syntactic structures from table images. In 2019 International Conference on Document Analysis and Recognition (ICDAR) , pages 749-755. IEEE, 2019. 3"}, {"label": "list_item", "id": 11, "page_no": 9, "cluster": {"id": 11, "label": "list_item", "bbox": {"l": 50.112, "t": 550.643, "r": 286.363, "b": 591.217, "coord_origin": "TOPLEFT"}, "confidence": 0.8241521716117859, "cells": [{"index": 109, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 558.34, "r_x1": 65.05, "r_y1": 558.34, "r_x2": 65.05, "r_y2": 550.643, "r_x3": 50.112, "r_y3": 550.643, "coord_origin": "TOPLEFT"}, "text": "[34]", "orig": "[34]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 110, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 558.34, "r_x1": 125.008, "r_y1": 558.34, "r_x2": 125.008, "r_y2": 550.643, "r_x3": 70.035, "r_y3": 550.643, "coord_origin": "TOPLEFT"}, "text": "Wenyuan Xue,", "orig": "Wenyuan Xue,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 111, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 129.823, "r_y0": 558.34, "r_x1": 181.676, "r_y1": 558.34, "r_x2": 181.676, "r_y2": 550.643, "r_x3": 129.823, "r_y3": 550.643, "coord_origin": "TOPLEFT"}, "text": "Baosheng Yu,", "orig": "Baosheng Yu,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 112, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 186.491, "r_y0": 558.34, "r_x1": 286.359, "r_y1": 558.34, "r_x2": 286.359, "r_y2": 550.643, "r_x3": 186.491, "r_y3": 550.643, "coord_origin": "TOPLEFT"}, "text": "Wen Wang, Dacheng Tao,", "orig": "Wen Wang, Dacheng Tao,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 113, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 569.299, "r_x1": 137.082, "r_y1": 569.299, "r_x2": 137.082, "r_y2": 561.602, "r_x3": 70.031, "r_y3": 561.602, "coord_origin": "TOPLEFT"}, "text": "and Qingyong Li.", "orig": "and Qingyong Li.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 114, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 145.985, "r_y0": 569.299, "r_x1": 172.382, "r_y1": 569.299, "r_x2": 172.382, "r_y2": 561.602, "r_x3": 145.985, "r_y3": 561.602, "coord_origin": "TOPLEFT"}, "text": "Tgrnet:", "orig": "Tgrnet:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 115, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 178.704, "r_y0": 569.299, "r_x1": 206.625, "r_y1": 569.299, "r_x2": 206.625, "r_y2": 561.602, "r_x3": 178.704, "r_y3": 561.602, "coord_origin": "TOPLEFT"}, "text": "A table", "orig": "A table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 116, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 210.633, "r_y0": 569.299, "r_x1": 286.363, "r_y1": 569.299, "r_x2": 286.363, "r_y2": 561.602, "r_x3": 210.633, "r_y3": 561.602, "coord_origin": "TOPLEFT"}, "text": "graph reconstruction", "orig": "graph reconstruction", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 117, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 580.258, "r_x1": 99.324, "r_y1": 580.258, "r_x2": 99.324, "r_y2": 572.561, "r_x3": 70.031, "r_y3": 572.561, "coord_origin": "TOPLEFT"}, "text": "network", "orig": "network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 118, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 104.157, "r_y0": 580.258, "r_x1": 114.612, "r_y1": 580.258, "r_x2": 114.612, "r_y2": 572.561, "r_x3": 104.157, "r_y3": 572.561, "coord_origin": "TOPLEFT"}, "text": "for", "orig": "for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 119, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 119.454, "r_y0": 580.258, "r_x1": 136.884, "r_y1": 580.258, "r_x2": 136.884, "r_y2": 572.561, "r_x3": 119.454, "r_y3": 572.561, "coord_origin": "TOPLEFT"}, "text": "table", "orig": "table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 120, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 141.717, "r_y0": 580.258, "r_x1": 173.091, "r_y1": 580.258, "r_x2": 173.091, "r_y2": 572.561, "r_x3": 141.717, "r_y3": 572.561, "coord_origin": "TOPLEFT"}, "text": "structure", "orig": "structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 121, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 177.933, "r_y0": 580.258, "r_x1": 221.007, "r_y1": 580.258, "r_x2": 221.007, "r_y2": 572.561, "r_x3": 177.933, "r_y3": 572.561, "coord_origin": "TOPLEFT"}, "text": "recognition.", "orig": "recognition.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 122, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 232.543, "r_y0": 580.129, "r_x1": 252.466, "r_y1": 580.129, "r_x2": 252.466, "r_y2": 572.399, "r_x3": 232.543, "r_y3": 572.399, "coord_origin": "TOPLEFT"}, "text": "arXiv", "orig": "arXiv", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 123, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 257.299, "r_y0": 580.129, "r_x1": 286.359, "r_y1": 580.129, "r_x2": 286.359, "r_y2": 572.399, "r_x3": 257.299, "r_y3": 572.399, "coord_origin": "TOPLEFT"}, "text": "preprint", "orig": "preprint", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 124, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 591.088, "r_x1": 135.531, "r_y1": 591.088, "r_x2": 135.531, "r_y2": 583.358, "r_x3": 70.031, "r_y3": 583.358, "coord_origin": "TOPLEFT"}, "text": "arXiv:2106.10598", "orig": "arXiv:2106.10598", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 125, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 135.53, "r_y0": 591.217, "r_x1": 167.899, "r_y1": 591.217, "r_x2": 167.899, "r_y2": 583.52, "r_x3": 135.53, "r_y3": 583.52, "coord_origin": "TOPLEFT"}, "text": ", 2021. 3", "orig": ", 2021. 3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[34] Wenyuan Xue, Baosheng Yu, Wen Wang, Dacheng Tao, and Qingyong Li. Tgrnet: A table graph reconstruction network for table structure recognition. arXiv preprint arXiv:2106.10598 , 2021. 3"}, {"label": "list_item", "id": 10, "page_no": 9, "cluster": {"id": 10, "label": "list_item", "bbox": {"l": 50.112, "t": 594.844, "r": 286.363, "b": 635.418, "coord_origin": "TOPLEFT"}, "confidence": 0.8360886573791504, "cells": [{"index": 126, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 602.5409999999999, "r_x1": 65.05, "r_y1": 602.5409999999999, "r_x2": 65.05, "r_y2": 594.844, "r_x3": 50.112, "r_y3": 594.844, "coord_origin": "TOPLEFT"}, "text": "[35]", "orig": "[35]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 127, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 602.5409999999999, "r_x1": 286.359, "r_y1": 602.5409999999999, "r_x2": 286.359, "r_y2": 594.844, "r_x3": 70.035, "r_y3": 594.844, "coord_origin": "TOPLEFT"}, "text": "Quanzeng You, Hailin Jin, Zhaowen Wang, Chen Fang, and", "orig": "Quanzeng You, Hailin Jin, Zhaowen Wang, Chen Fang, and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 128, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 613.5, "r_x1": 109.107, "r_y1": 613.5, "r_x2": 109.107, "r_y2": 605.803, "r_x3": 70.031, "r_y3": 605.803, "coord_origin": "TOPLEFT"}, "text": "Jiebo Luo.", "orig": "Jiebo Luo.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 129, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 116.226, "r_y0": 613.5, "r_x1": 271.766, "r_y1": 613.5, "r_x2": 271.766, "r_y2": 605.803, "r_x3": 116.226, "r_y3": 605.803, "coord_origin": "TOPLEFT"}, "text": "Image captioning with semantic attention.", "orig": "Image captioning with semantic attention.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 130, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 278.894, "r_y0": 613.5, "r_x1": 286.363, "r_y1": 613.5, "r_x2": 286.363, "r_y2": 605.803, "r_x3": 278.894, "r_y3": 605.803, "coord_origin": "TOPLEFT"}, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 131, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 624.33, "r_x1": 286.363, "r_y1": 624.33, "r_x2": 286.363, "r_y2": 616.6, "r_x3": 70.031, "r_y3": 616.6, "coord_origin": "TOPLEFT"}, "text": "Proceedings of the IEEE conference on computer vision and", "orig": "Proceedings of the IEEE conference on computer vision and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 132, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 635.289, "r_x1": 139.099, "r_y1": 635.289, "r_x2": 139.099, "r_y2": 627.559, "r_x3": 70.031, "r_y3": 627.559, "coord_origin": "TOPLEFT"}, "text": "pattern recognition", "orig": "pattern recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 133, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 139.098, "r_y0": 635.418, "r_x1": 238.957, "r_y1": 635.418, "r_x2": 238.957, "r_y2": 627.721, "r_x3": 139.098, "r_y3": 627.721, "coord_origin": "TOPLEFT"}, "text": ", pages 4651-4659, 2016. 4", "orig": ", pages 4651-4659, 2016. 4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[35] Quanzeng You, Hailin Jin, Zhaowen Wang, Chen Fang, and Jiebo Luo. Image captioning with semantic attention. In Proceedings of the IEEE conference on computer vision and pattern recognition , pages 4651-4659, 2016. 4"}, {"label": "list_item", "id": 12, "page_no": 9, "cluster": {"id": 12, "label": "list_item", "bbox": {"l": 50.112, "t": 639.045, "r": 286.363, "b": 690.577, "coord_origin": "TOPLEFT"}, "confidence": 0.8079474568367004, "cells": [{"index": 134, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 646.742, "r_x1": 65.05, "r_y1": 646.742, "r_x2": 65.05, "r_y2": 639.045, "r_x3": 50.112, "r_y3": 639.045, "coord_origin": "TOPLEFT"}, "text": "[36]", "orig": "[36]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 135, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 646.742, "r_x1": 286.359, "r_y1": 646.742, "r_x2": 286.359, "r_y2": 639.045, "r_x3": 70.035, "r_y3": 639.045, "coord_origin": "TOPLEFT"}, "text": "Xinyi Zheng, Doug Burdick, Lucian Popa, Peter Zhong, and", "orig": "Xinyi Zheng, Doug Burdick, Lucian Popa, Peter Zhong, and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 136, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 657.7, "r_x1": 286.363, "r_y1": 657.7, "r_x2": 286.363, "r_y2": 650.0029999999999, "r_x3": 70.031, "r_y3": 650.0029999999999, "coord_origin": "TOPLEFT"}, "text": "Nancy Xin Ru Wang. Global table extractor (gte): A frame-", "orig": "Nancy Xin Ru Wang. Global table extractor (gte): A frame-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 137, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 668.659, "r_x1": 286.363, "r_y1": 668.659, "r_x2": 286.363, "r_y2": 660.962, "r_x3": 70.031, "r_y3": 660.962, "coord_origin": "TOPLEFT"}, "text": "work for joint table identification and cell structure recogni-", "orig": "work for joint table identification and cell structure recogni-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 138, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 679.6179999999999, "r_x1": 158.458, "r_y1": 679.6179999999999, "r_x2": 158.458, "r_y2": 671.921, "r_x3": 70.031, "r_y3": 671.921, "coord_origin": "TOPLEFT"}, "text": "tion using visual context.", "orig": "tion using visual context.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 139, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.528, "r_y0": 679.489, "r_x1": 286.362, "r_y1": 679.489, "r_x2": 286.362, "r_y2": 671.759, "r_x3": 160.528, "r_y3": 671.759, "coord_origin": "TOPLEFT"}, "text": "Winter Conference for Applications", "orig": "Winter Conference for Applications", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 140, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 690.448, "r_x1": 171.423, "r_y1": 690.448, "r_x2": 171.423, "r_y2": 682.718, "r_x3": 70.031, "r_y3": 682.718, "coord_origin": "TOPLEFT"}, "text": "in Computer Vision (WACV)", "orig": "in Computer Vision (WACV)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 141, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 171.422, "r_y0": 690.577, "r_x1": 212.757, "r_y1": 690.577, "r_x2": 212.757, "r_y2": 682.88, "r_x3": 171.422, "r_y3": 682.88, "coord_origin": "TOPLEFT"}, "text": ", 2021. 2, 3", "orig": ", 2021. 2, 3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[36] Xinyi Zheng, Doug Burdick, Lucian Popa, Peter Zhong, and Nancy Xin Ru Wang. Global table extractor (gte): A framework for joint table identification and cell structure recognition using visual context. Winter Conference for Applications in Computer Vision (WACV) , 2021. 2, 3"}, {"label": "list_item", "id": 8, "page_no": 9, "cluster": {"id": 8, "label": "list_item", "bbox": {"l": 50.112, "t": 694.204, "r": 286.363, "b": 712.86, "coord_origin": "TOPLEFT"}, "confidence": 0.8385783433914185, "cells": [{"index": 142, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 701.901, "r_x1": 65.05, "r_y1": 701.901, "r_x2": 65.05, "r_y2": 694.204, "r_x3": 50.112, "r_y3": 694.204, "coord_origin": "TOPLEFT"}, "text": "[37]", "orig": "[37]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 143, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 701.901, "r_x1": 80.992, "r_y1": 701.901, "r_x2": 80.992, "r_y2": 694.204, "r_x3": 70.035, "r_y3": 694.204, "coord_origin": "TOPLEFT"}, "text": "Xu", "orig": "Xu", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 144, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 89.062, "r_y0": 701.901, "r_x1": 114.715, "r_y1": 701.901, "r_x2": 114.715, "r_y2": 694.204, "r_x3": 89.062, "r_y3": 694.204, "coord_origin": "TOPLEFT"}, "text": "Zhong,", "orig": "Zhong,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 145, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 124.246, "r_y0": 701.901, "r_x1": 149.146, "r_y1": 701.901, "r_x2": 149.146, "r_y2": 694.204, "r_x3": 124.246, "r_y3": 694.204, "coord_origin": "TOPLEFT"}, "text": "Elaheh", "orig": "Elaheh", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 146, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 157.225, "r_y0": 701.901, "r_x1": 209.373, "r_y1": 701.901, "r_x2": 209.373, "r_y2": 694.204, "r_x3": 157.225, "r_y3": 694.204, "coord_origin": "TOPLEFT"}, "text": "ShafieiBavani,", "orig": "ShafieiBavani,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 147, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 218.904, "r_y0": 701.901, "r_x1": 231.852, "r_y1": 701.901, "r_x2": 231.852, "r_y2": 694.204, "r_x3": 218.904, "r_y3": 694.204, "coord_origin": "TOPLEFT"}, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 148, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 239.931, "r_y0": 701.901, "r_x1": 269.323, "r_y1": 701.901, "r_x2": 269.323, "r_y2": 694.204, "r_x3": 239.931, "r_y3": 694.204, "coord_origin": "TOPLEFT"}, "text": "Antonio", "orig": "Antonio", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 149, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 277.392, "r_y0": 701.901, "r_x1": 286.359, "r_y1": 701.901, "r_x2": 286.359, "r_y2": 694.204, "r_x3": 277.392, "r_y3": 694.204, "coord_origin": "TOPLEFT"}, "text": "Ji-", "orig": "Ji-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 150, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 712.86, "r_x1": 116.719, "r_y1": 712.86, "r_x2": 116.719, "r_y2": 705.163, "r_x3": 70.031, "r_y3": 705.163, "coord_origin": "TOPLEFT"}, "text": "meno Yepes.", "orig": "meno Yepes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 151, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 122.413, "r_y0": 712.86, "r_x1": 235.013, "r_y1": 712.86, "r_x2": 235.013, "r_y2": 705.163, "r_x3": 122.413, "r_y3": 705.163, "coord_origin": "TOPLEFT"}, "text": "Image-based table recognition:", "orig": "Image-based table recognition:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 152, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 239.335, "r_y0": 712.86, "r_x1": 286.363, "r_y1": 712.86, "r_x2": 286.363, "r_y2": 705.163, "r_x3": 239.335, "r_y3": 705.163, "coord_origin": "TOPLEFT"}, "text": "Data, model,", "orig": "Data, model,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[37] Xu Zhong, Elaheh ShafieiBavani, and Antonio Jimeno Yepes. Image-based table recognition: Data, model,"}, {"label": "list_item", "id": 14, "page_no": 9, "cluster": {"id": 14, "label": "list_item", "bbox": {"l": 328.781, "t": 76.12599999999998, "r": 545.115, "b": 116.69899999999996, "coord_origin": "TOPLEFT"}, "confidence": 0.7556979060173035, "cells": [{"index": 153, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 83.82299999999998, "r_x1": 383.646, "r_y1": 83.82299999999998, "r_x2": 383.646, "r_y2": 76.12599999999998, "r_x3": 328.781, "r_y3": 76.12599999999998, "coord_origin": "TOPLEFT"}, "text": "and evaluation.", "orig": "and evaluation.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 154, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 388.56, "r_y0": 83.82299999999998, "r_x1": 545.113, "r_y1": 83.82299999999998, "r_x2": 545.113, "r_y2": 76.12599999999998, "r_x3": 388.56, "r_y3": 76.12599999999998, "coord_origin": "TOPLEFT"}, "text": "In Andrea Vedaldi, Horst Bischof, Thomas", "orig": "In Andrea Vedaldi, Horst Bischof, Thomas", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 155, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 94.78099999999995, "r_x1": 472.306, "r_y1": 94.78099999999995, "r_x2": 472.306, "r_y2": 87.08399999999995, "r_x3": 328.781, "r_y3": 87.08399999999995, "coord_origin": "TOPLEFT"}, "text": "Brox, and Jan-Michael Frahm, editors,", "orig": "Brox, and Jan-Michael Frahm, editors,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 156, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 475.885, "r_y0": 94.65200000000004, "r_x1": 545.115, "r_y1": 94.65200000000004, "r_x2": 545.115, "r_y2": 86.92200000000003, "r_x3": 475.885, "r_y3": 86.92200000000003, "coord_origin": "TOPLEFT"}, "text": "Computer Vision -", "orig": "Computer Vision -", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 157, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 105.61099999999999, "r_x1": 371.927, "r_y1": 105.61099999999999, "r_x2": 371.927, "r_y2": 97.88099999999997, "r_x3": 328.781, "r_y3": 97.88099999999997, "coord_origin": "TOPLEFT"}, "text": "ECCV 2020", "orig": "ECCV 2020", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 158, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 371.926, "r_y0": 105.74000000000001, "r_x1": 374.168, "r_y1": 105.74000000000001, "r_x2": 374.168, "r_y2": 98.043, "r_x3": 371.926, "r_y3": 98.043, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 159, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 376.472, "r_y0": 105.74000000000001, "r_x1": 545.112, "r_y1": 105.74000000000001, "r_x2": 545.112, "r_y2": 98.043, "r_x3": 376.472, "r_y3": 98.043, "coord_origin": "TOPLEFT"}, "text": "pages 564-580, Cham, 2020. Springer Interna-", "orig": "pages 564-580, Cham, 2020. Springer Interna-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 160, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 116.69899999999996, "r_x1": 417.701, "r_y1": 116.69899999999996, "r_x2": 417.701, "r_y2": 109.00199999999995, "r_x3": 328.781, "r_y3": 109.00199999999995, "coord_origin": "TOPLEFT"}, "text": "tional Publishing. 2, 3, 7", "orig": "tional Publishing. 2, 3, 7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "and evaluation. In Andrea Vedaldi, Horst Bischof, Thomas Brox, and Jan-Michael Frahm, editors, Computer Vision ECCV 2020 , pages 564-580, Cham, 2020. Springer International Publishing. 2, 3, 7"}, {"label": "list_item", "id": 9, "page_no": 9, "cluster": {"id": 9, "label": "list_item", "bbox": {"l": 308.862, "t": 120.957, "r": 545.113, "b": 161.53099999999995, "coord_origin": "TOPLEFT"}, "confidence": 0.8375797271728516, "cells": [{"index": 161, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 128.654, "r_x1": 323.8, "r_y1": 128.654, "r_x2": 323.8, "r_y2": 120.957, "r_x3": 308.862, "r_y3": 120.957, "coord_origin": "TOPLEFT"}, "text": "[38]", "orig": "[38]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 162, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.785, "r_y0": 128.654, "r_x1": 523.15, "r_y1": 128.654, "r_x2": 523.15, "r_y2": 120.957, "r_x3": 328.785, "r_y3": 120.957, "coord_origin": "TOPLEFT"}, "text": "Xu Zhong, Jianbin Tang, and Antonio Jimeno Yepes.", "orig": "Xu Zhong, Jianbin Tang, and Antonio Jimeno Yepes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 163, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 528.171, "r_y0": 128.654, "r_x1": 545.109, "r_y1": 128.654, "r_x2": 545.109, "r_y2": 120.957, "r_x3": 528.171, "r_y3": 120.957, "coord_origin": "TOPLEFT"}, "text": "Pub-", "orig": "Pub-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 164, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 139.61300000000006, "r_x1": 545.113, "r_y1": 139.61300000000006, "r_x2": 545.113, "r_y2": 131.91600000000005, "r_x3": 328.781, "r_y3": 131.91600000000005, "coord_origin": "TOPLEFT"}, "text": "laynet: Largest dataset ever for document layout analysis. In", "orig": "laynet: Largest dataset ever for document layout analysis. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 165, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 150.44299999999998, "r_x1": 545.113, "r_y1": 150.44299999999998, "r_x2": 545.113, "r_y2": 142.71299999999997, "r_x3": 328.781, "r_y3": 142.71299999999997, "coord_origin": "TOPLEFT"}, "text": "2019 International Conference on Document Analysis and", "orig": "2019 International Conference on Document Analysis and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 166, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 161.40200000000004, "r_x1": 406.322, "r_y1": 161.40200000000004, "r_x2": 406.322, "r_y2": 153.67200000000003, "r_x3": 328.781, "r_y3": 153.67200000000003, "coord_origin": "TOPLEFT"}, "text": "Recognition (ICDAR)", "orig": "Recognition (ICDAR)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 167, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 406.322, "r_y0": 161.53099999999995, "r_x1": 506.181, "r_y1": 161.53099999999995, "r_x2": 506.181, "r_y2": 153.83399999999995, "r_x3": 406.322, "r_y3": 153.83399999999995, "coord_origin": "TOPLEFT"}, "text": ", pages 1015-1022, 2019. 1", "orig": ", pages 1015-1022, 2019. 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[38] Xu Zhong, Jianbin Tang, and Antonio Jimeno Yepes. Publaynet: Largest dataset ever for document layout analysis. In 2019 International Conference on Document Analysis and Recognition (ICDAR) , pages 1015-1022, 2019. 1"}, {"label": "page_footer", "id": 0, "page_no": 9, "cluster": {"id": 0, "label": "page_footer", "bbox": {"l": 292.63, "t": 734.402, "r": 302.593, "b": 742.954, "coord_origin": "TOPLEFT"}, "confidence": 0.9069584012031555, "cells": [{"index": 168, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 292.63, "r_y0": 742.954, "r_x1": 302.593, "r_y1": 742.954, "r_x2": 302.593, "r_y2": 734.402, "r_x3": 292.63, "r_y3": 734.402, "coord_origin": "TOPLEFT"}, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "10"}], "body": [{"label": "text", "id": 15, "page_no": 9, "cluster": {"id": 15, "label": "text", "bbox": {"l": 70.031, "t": 75.96400000000006, "r": 286.362, "b": 94.78200000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.6886764168739319, "cells": [{"index": 0, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 83.69399999999996, "r_x1": 223.581, "r_y1": 83.69399999999996, "r_x2": 223.581, "r_y2": 75.96400000000006, "r_x3": 70.031, "r_y3": 75.96400000000006, "coord_origin": "TOPLEFT"}, "text": "Computer Vision and Pattern Recognition", "orig": "Computer Vision and Pattern Recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 223.579, "r_y0": 83.82299999999998, "r_x1": 225.821, "r_y1": 83.82299999999998, "r_x2": 225.821, "r_y2": 76.12599999999998, "r_x3": 223.579, "r_y3": 76.12599999999998, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 229.183, "r_y0": 83.82299999999998, "r_x1": 286.362, "r_y1": 83.82299999999998, "r_x2": 286.362, "r_y2": 76.12599999999998, "r_x3": 229.183, "r_y3": 76.12599999999998, "coord_origin": "TOPLEFT"}, "text": "pages 658-666,", "orig": "pages 658-666,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 94.78200000000004, "r_x1": 97.917, "r_y1": 94.78200000000004, "r_x2": 97.917, "r_y2": 87.08500000000004, "r_x3": 70.031, "r_y3": 87.08500000000004, "coord_origin": "TOPLEFT"}, "text": "2019. 6", "orig": "2019. 6", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Computer Vision and Pattern Recognition , pages 658-666, 2019. 6"}, {"label": "list_item", "id": 13, "page_no": 9, "cluster": {"id": 13, "label": "list_item", "bbox": {"l": 50.112, "t": 98.40800000000002, "r": 286.366, "b": 160.89999999999998, "coord_origin": "TOPLEFT"}, "confidence": 0.7723011374473572, "cells": [{"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 106.10500000000002, "r_x1": 65.05, "r_y1": 106.10500000000002, "r_x2": 65.05, "r_y2": 98.40800000000002, "r_x3": 50.112, "r_y3": 98.40800000000002, "coord_origin": "TOPLEFT"}, "text": "[26]", "orig": "[26]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 106.10500000000002, "r_x1": 286.359, "r_y1": 106.10500000000002, "r_x2": 286.359, "r_y2": 98.40800000000002, "r_x3": 70.035, "r_y3": 98.40800000000002, "coord_origin": "TOPLEFT"}, "text": "Sebastian Schreiber, Stefan Agne, Ivo Wolf, Andreas Den-", "orig": "Sebastian Schreiber, Stefan Agne, Ivo Wolf, Andreas Den-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 117.06399999999996, "r_x1": 286.363, "r_y1": 117.06399999999996, "r_x2": 286.363, "r_y2": 109.36699999999996, "r_x3": 70.031, "r_y3": 109.36699999999996, "coord_origin": "TOPLEFT"}, "text": "gel, and Sheraz Ahmed. Deepdesrt: Deep learning for detec-", "orig": "gel, and Sheraz Ahmed. Deepdesrt: Deep learning for detec-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 128.02300000000002, "r_x1": 286.363, "r_y1": 128.02300000000002, "r_x2": 286.363, "r_y2": 120.32600000000002, "r_x3": 70.031, "r_y3": 120.32600000000002, "coord_origin": "TOPLEFT"}, "text": "tion and structure recognition of tables in document images.", "orig": "tion and structure recognition of tables in document images.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 138.98199999999997, "r_x1": 77.5, "r_y1": 138.98199999999997, "r_x2": 77.5, "r_y2": 131.28499999999997, "r_x3": 70.031, "r_y3": 131.28499999999997, "coord_origin": "TOPLEFT"}, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 80.56, "r_y0": 138.85299999999995, "r_x1": 286.366, "r_y1": 138.85299999999995, "r_x2": 286.366, "r_y2": 131.12300000000005, "r_x3": 80.56, "r_y3": 131.12300000000005, "coord_origin": "TOPLEFT"}, "text": "2017 14th IAPR International Conference on Document", "orig": "2017 14th IAPR International Conference on Document", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 149.812, "r_x1": 195.229, "r_y1": 149.812, "r_x2": 195.229, "r_y2": 142.082, "r_x3": 70.031, "r_y3": 142.082, "coord_origin": "TOPLEFT"}, "text": "Analysis and Recognition (ICDAR)", "orig": "Analysis and Recognition (ICDAR)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 195.231, "r_y0": 149.94100000000003, "r_x1": 286.365, "r_y1": 149.94100000000003, "r_x2": 286.365, "r_y2": 142.24400000000003, "r_x3": 195.231, "r_y3": 142.24400000000003, "coord_origin": "TOPLEFT"}, "text": ", volume 01, pages 1162-", "orig": ", volume 01, pages 1162-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 160.89999999999998, "r_x1": 120.333, "r_y1": 160.89999999999998, "r_x2": 120.333, "r_y2": 153.20299999999997, "r_x3": 70.031, "r_y3": 153.20299999999997, "coord_origin": "TOPLEFT"}, "text": "1167, 2017. 1", "orig": "1167, 2017. 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[26] Sebastian Schreiber, Stefan Agne, Ivo Wolf, Andreas Dengel, and Sheraz Ahmed. Deepdesrt: Deep learning for detection and structure recognition of tables in document images. In 2017 14th IAPR International Conference on Document Analysis and Recognition (ICDAR) , volume 01, pages 11621167, 2017. 1"}, {"label": "list_item", "id": 2, "page_no": 9, "cluster": {"id": 2, "label": "list_item", "bbox": {"l": 50.112, "t": 164.52700000000004, "r": 286.363, "b": 227.01800000000003, "coord_origin": "TOPLEFT"}, "confidence": 0.8580600619316101, "cells": [{"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 172.22400000000005, "r_x1": 65.05, "r_y1": 172.22400000000005, "r_x2": 65.05, "r_y2": 164.52700000000004, "r_x3": 50.112, "r_y3": 164.52700000000004, "coord_origin": "TOPLEFT"}, "text": "[27]", "orig": "[27]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 172.22400000000005, "r_x1": 286.359, "r_y1": 172.22400000000005, "r_x2": 286.359, "r_y2": 164.52700000000004, "r_x3": 70.035, "r_y3": 164.52700000000004, "coord_origin": "TOPLEFT"}, "text": "Sebastian Schreiber, Stefan Agne, Ivo Wolf, Andreas Den-", "orig": "Sebastian Schreiber, Stefan Agne, Ivo Wolf, Andreas Den-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 183.183, "r_x1": 158.395, "r_y1": 183.183, "r_x2": 158.395, "r_y2": 175.486, "r_x3": 70.031, "r_y3": 175.486, "coord_origin": "TOPLEFT"}, "text": "gel, and Sheraz Ahmed.", "orig": "gel, and Sheraz Ahmed.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 164.035, "r_y0": 183.183, "r_x1": 202.877, "r_y1": 183.183, "r_x2": 202.877, "r_y2": 175.486, "r_x3": 164.035, "r_y3": 175.486, "coord_origin": "TOPLEFT"}, "text": "Deepdesrt:", "orig": "Deepdesrt:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 207.163, "r_y0": 183.183, "r_x1": 286.363, "r_y1": 183.183, "r_x2": 286.363, "r_y2": 175.486, "r_x3": 207.163, "r_y3": 175.486, "coord_origin": "TOPLEFT"}, "text": "Deep learning for de-", "orig": "Deep learning for de-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 194.14200000000005, "r_x1": 286.363, "r_y1": 194.14200000000005, "r_x2": 286.363, "r_y2": 186.44500000000005, "r_x3": 70.031, "r_y3": 186.44500000000005, "coord_origin": "TOPLEFT"}, "text": "tection and structure recognition of tables in document im-", "orig": "tection and structure recognition of tables in document im-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 19, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 205.101, "r_x1": 88.206, "r_y1": 205.101, "r_x2": 88.206, "r_y2": 197.404, "r_x3": 70.031, "r_y3": 197.404, "coord_origin": "TOPLEFT"}, "text": "ages.", "orig": "ages.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 20, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 93.864, "r_y0": 205.101, "r_x1": 101.333, "r_y1": 205.101, "r_x2": 101.333, "r_y2": 197.404, "r_x3": 93.864, "r_y3": 197.404, "coord_origin": "TOPLEFT"}, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 21, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 104.331, "r_y0": 204.97199999999998, "r_x1": 286.358, "r_y1": 204.97199999999998, "r_x2": 286.358, "r_y2": 197.24199999999996, "r_x3": 104.331, "r_y3": 197.24199999999996, "coord_origin": "TOPLEFT"}, "text": "2017 14th IAPR international conference on doc-", "orig": "2017 14th IAPR international conference on doc-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 22, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 215.92999999999995, "r_x1": 220.487, "r_y1": 215.92999999999995, "r_x2": 220.487, "r_y2": 208.20000000000005, "r_x3": 70.031, "r_y3": 208.20000000000005, "coord_origin": "TOPLEFT"}, "text": "ument analysis and recognition (ICDAR)", "orig": "ument analysis and recognition (ICDAR)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 23, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 220.484, "r_y0": 216.05899999999997, "r_x1": 222.726, "r_y1": 216.05899999999997, "r_x2": 222.726, "r_y2": 208.36199999999997, "r_x3": 220.484, "r_y3": 208.36199999999997, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 24, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 225.909, "r_y0": 216.05899999999997, "r_x1": 286.36, "r_y1": 216.05899999999997, "r_x2": 286.36, "r_y2": 208.36199999999997, "r_x3": 225.909, "r_y3": 208.36199999999997, "coord_origin": "TOPLEFT"}, "text": "volume 1, pages", "orig": "volume 1, pages", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 25, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 227.01800000000003, "r_x1": 166.653, "r_y1": 227.01800000000003, "r_x2": 166.653, "r_y2": 219.32100000000003, "r_x3": 70.031, "r_y3": 219.32100000000003, "coord_origin": "TOPLEFT"}, "text": "1162-1167. IEEE, 2017. 3", "orig": "1162-1167. IEEE, 2017. 3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[27] Sebastian Schreiber, Stefan Agne, Ivo Wolf, Andreas Dengel, and Sheraz Ahmed. Deepdesrt: Deep learning for detection and structure recognition of tables in document images. In 2017 14th IAPR international conference on document analysis and recognition (ICDAR) , volume 1, pages 1162-1167. IEEE, 2017. 3"}, {"label": "list_item", "id": 4, "page_no": 9, "cluster": {"id": 4, "label": "list_item", "bbox": {"l": 50.112, "t": 230.64499999999998, "r": 286.366, "b": 271.21900000000005, "coord_origin": "TOPLEFT"}, "confidence": 0.8512731194496155, "cells": [{"index": 26, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 238.34199999999998, "r_x1": 65.05, "r_y1": 238.34199999999998, "r_x2": 65.05, "r_y2": 230.64499999999998, "r_x3": 50.112, "r_y3": 230.64499999999998, "coord_origin": "TOPLEFT"}, "text": "[28]", "orig": "[28]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 27, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 238.34199999999998, "r_x1": 179.147, "r_y1": 238.34199999999998, "r_x2": 179.147, "r_y2": 230.64499999999998, "r_x3": 70.035, "r_y3": 230.64499999999998, "coord_origin": "TOPLEFT"}, "text": "Faisal Shafait and Ray Smith.", "orig": "Faisal Shafait and Ray Smith.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 28, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 184.366, "r_y0": 238.34199999999998, "r_x1": 286.359, "r_y1": 238.34199999999998, "r_x2": 286.359, "r_y2": 230.64499999999998, "r_x3": 184.366, "r_y3": 230.64499999999998, "coord_origin": "TOPLEFT"}, "text": "Table detection in heteroge-", "orig": "Table detection in heteroge-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 29, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 249.30100000000004, "r_x1": 134.804, "r_y1": 249.30100000000004, "r_x2": 134.804, "r_y2": 241.60400000000004, "r_x3": 70.031, "r_y3": 241.60400000000004, "coord_origin": "TOPLEFT"}, "text": "neous documents.", "orig": "neous documents.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 30, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 139.7, "r_y0": 249.30100000000004, "r_x1": 147.169, "r_y1": 249.30100000000004, "r_x2": 147.169, "r_y2": 241.60400000000004, "r_x3": 139.7, "r_y3": 241.60400000000004, "coord_origin": "TOPLEFT"}, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 149.933, "r_y0": 249.17200000000003, "r_x1": 286.366, "r_y1": 249.17200000000003, "r_x2": 286.366, "r_y2": 241.442, "r_x3": 149.933, "r_y3": 241.442, "coord_origin": "TOPLEFT"}, "text": "Proceedings of the 9th IAPR Interna-", "orig": "Proceedings of the 9th IAPR Interna-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 260.131, "r_x1": 244.688, "r_y1": 260.131, "r_x2": 244.688, "r_y2": 252.40099999999995, "r_x3": 70.031, "r_y3": 252.40099999999995, "coord_origin": "TOPLEFT"}, "text": "tional Workshop on Document Analysis Systems", "orig": "tional Workshop on Document Analysis Systems", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 244.691, "r_y0": 260.26, "r_x1": 246.933, "r_y1": 260.26, "r_x2": 246.933, "r_y2": 252.563, "r_x3": 244.691, "r_y3": 252.563, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 249.775, "r_y0": 260.26, "r_x1": 286.358, "r_y1": 260.26, "r_x2": 286.358, "r_y2": 252.563, "r_x3": 249.775, "r_y3": 252.563, "coord_origin": "TOPLEFT"}, "text": "pages 65-", "orig": "pages 65-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 271.21900000000005, "r_x1": 111.366, "r_y1": 271.21900000000005, "r_x2": 111.366, "r_y2": 263.52200000000005, "r_x3": 70.031, "r_y3": 263.52200000000005, "coord_origin": "TOPLEFT"}, "text": "72, 2010. 2", "orig": "72, 2010. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[28] Faisal Shafait and Ray Smith. Table detection in heterogeneous documents. In Proceedings of the 9th IAPR International Workshop on Document Analysis Systems , pages 6572, 2010. 2"}, {"label": "list_item", "id": 5, "page_no": 9, "cluster": {"id": 5, "label": "list_item", "bbox": {"l": 50.112, "t": 274.846, "r": 286.366, "b": 326.378, "coord_origin": "TOPLEFT"}, "confidence": 0.8494512438774109, "cells": [{"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 282.543, "r_x1": 65.05, "r_y1": 282.543, "r_x2": 65.05, "r_y2": 274.846, "r_x3": 50.112, "r_y3": 274.846, "coord_origin": "TOPLEFT"}, "text": "[29]", "orig": "[29]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 282.543, "r_x1": 94.944, "r_y1": 282.543, "r_x2": 94.944, "r_y2": 274.846, "r_x3": 70.035, "r_y3": 274.846, "coord_origin": "TOPLEFT"}, "text": "Shoaib", "orig": "Shoaib", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 100.871, "r_y0": 282.543, "r_x1": 127.268, "r_y1": 282.543, "r_x2": 127.268, "r_y2": 274.846, "r_x3": 100.871, "r_y3": 274.846, "coord_origin": "TOPLEFT"}, "text": "Ahmed", "orig": "Ahmed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 133.195, "r_y0": 282.543, "r_x1": 165.832, "r_y1": 282.543, "r_x2": 165.832, "r_y2": 274.846, "r_x3": 133.195, "r_y3": 274.846, "coord_origin": "TOPLEFT"}, "text": "Siddiqui,", "orig": "Siddiqui,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 172.683, "r_y0": 282.543, "r_x1": 194.094, "r_y1": 282.543, "r_x2": 194.094, "r_y2": 274.846, "r_x3": 172.683, "r_y3": 274.846, "coord_origin": "TOPLEFT"}, "text": "Imran", "orig": "Imran", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 200.021, "r_y0": 282.543, "r_x1": 211.48, "r_y1": 282.543, "r_x2": 211.48, "r_y2": 274.846, "r_x3": 200.021, "r_y3": 274.846, "coord_origin": "TOPLEFT"}, "text": "Ali", "orig": "Ali", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 217.407, "r_y0": 282.543, "r_x1": 239.438, "r_y1": 282.543, "r_x2": 239.438, "r_y2": 274.846, "r_x3": 217.407, "r_y3": 274.846, "coord_origin": "TOPLEFT"}, "text": "Fateh,", "orig": "Fateh,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 246.288, "r_y0": 282.543, "r_x1": 264.221, "r_y1": 282.543, "r_x2": 264.221, "r_y2": 274.846, "r_x3": 246.288, "r_y3": 274.846, "coord_origin": "TOPLEFT"}, "text": "Syed", "orig": "Syed", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 270.147, "r_y0": 282.543, "r_x1": 286.359, "r_y1": 282.543, "r_x2": 286.359, "r_y2": 274.846, "r_x3": 270.147, "r_y3": 274.846, "coord_origin": "TOPLEFT"}, "text": "Tah-", "orig": "Tah-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 293.502, "r_x1": 85.964, "r_y1": 293.502, "r_x2": 85.964, "r_y2": 285.805, "r_x3": 70.031, "r_y3": 285.805, "coord_origin": "TOPLEFT"}, "text": "seen", "orig": "seen", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 91.021, "r_y0": 293.502, "r_x1": 108.945, "r_y1": 293.502, "r_x2": 108.945, "r_y2": 285.805, "r_x3": 91.021, "r_y3": 285.805, "coord_origin": "TOPLEFT"}, "text": "Raza", "orig": "Raza", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 114.002, "r_y0": 293.502, "r_x1": 135.674, "r_y1": 293.502, "r_x2": 135.674, "r_y2": 285.805, "r_x3": 114.002, "r_y3": 285.805, "coord_origin": "TOPLEFT"}, "text": "Rizvi,", "orig": "Rizvi,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 48, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 141.43, "r_y0": 293.502, "r_x1": 171.306, "r_y1": 293.502, "r_x2": 171.306, "r_y2": 285.805, "r_x3": 141.43, "r_y3": 285.805, "coord_origin": "TOPLEFT"}, "text": "Andreas", "orig": "Andreas", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 49, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 176.364, "r_y0": 293.502, "r_x1": 204.5, "r_y1": 293.502, "r_x2": 204.5, "r_y2": 285.805, "r_x3": 176.364, "r_y3": 285.805, "coord_origin": "TOPLEFT"}, "text": "Dengel,", "orig": "Dengel,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 50, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 210.265, "r_y0": 293.502, "r_x1": 223.213, "r_y1": 293.502, "r_x2": 223.213, "r_y2": 285.805, "r_x3": 210.265, "r_y3": 285.805, "coord_origin": "TOPLEFT"}, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 51, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 228.27, "r_y0": 293.502, "r_x1": 252.668, "r_y1": 293.502, "r_x2": 252.668, "r_y2": 285.805, "r_x3": 228.27, "r_y3": 285.805, "coord_origin": "TOPLEFT"}, "text": "Sheraz", "orig": "Sheraz", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 52, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 257.725, "r_y0": 293.502, "r_x1": 286.363, "r_y1": 293.502, "r_x2": 286.363, "r_y2": 285.805, "r_x3": 257.725, "r_y3": 285.805, "coord_origin": "TOPLEFT"}, "text": "Ahmed.", "orig": "Ahmed.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 53, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 304.461, "r_x1": 286.363, "r_y1": 304.461, "r_x2": 286.363, "r_y2": 296.764, "r_x3": 70.031, "r_y3": 296.764, "coord_origin": "TOPLEFT"}, "text": "Deeptabstr: Deep learning based table structure recognition.", "orig": "Deeptabstr: Deep learning based table structure recognition.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 54, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 315.42, "r_x1": 77.5, "r_y1": 315.42, "r_x2": 77.5, "r_y2": 307.723, "r_x3": 70.031, "r_y3": 307.723, "coord_origin": "TOPLEFT"}, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 55, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 79.35, "r_y0": 315.291, "r_x1": 286.366, "r_y1": 315.291, "r_x2": 286.366, "r_y2": 307.561, "r_x3": 79.35, "r_y3": 307.561, "coord_origin": "TOPLEFT"}, "text": "2019 International Conference on Document Analysis and", "orig": "2019 International Conference on Document Analysis and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 56, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 326.249, "r_x1": 147.572, "r_y1": 326.249, "r_x2": 147.572, "r_y2": 318.519, "r_x3": 70.031, "r_y3": 318.519, "coord_origin": "TOPLEFT"}, "text": "Recognition (ICDAR)", "orig": "Recognition (ICDAR)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 57, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 147.572, "r_y0": 326.378, "r_x1": 271.335, "r_y1": 326.378, "r_x2": 271.335, "r_y2": 318.681, "r_x3": 147.572, "r_y3": 318.681, "coord_origin": "TOPLEFT"}, "text": ", pages 1403-1409. IEEE, 2019. 3", "orig": ", pages 1403-1409. IEEE, 2019. 3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[29] Shoaib Ahmed Siddiqui, Imran Ali Fateh, Syed Tahseen Raza Rizvi, Andreas Dengel, and Sheraz Ahmed. Deeptabstr: Deep learning based table structure recognition. In 2019 International Conference on Document Analysis and Recognition (ICDAR) , pages 1403-1409. IEEE, 2019. 3"}, {"label": "list_item", "id": 3, "page_no": 9, "cluster": {"id": 3, "label": "list_item", "bbox": {"l": 50.112, "t": 330.005, "r": 286.363, "b": 381.538, "coord_origin": "TOPLEFT"}, "confidence": 0.8567671179771423, "cells": [{"index": 58, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 337.702, "r_x1": 65.05, "r_y1": 337.702, "r_x2": 65.05, "r_y2": 330.005, "r_x3": 50.112, "r_y3": 330.005, "coord_origin": "TOPLEFT"}, "text": "[30]", "orig": "[30]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 59, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 337.702, "r_x1": 286.359, "r_y1": 337.702, "r_x2": 286.359, "r_y2": 330.005, "r_x3": 70.035, "r_y3": 330.005, "coord_origin": "TOPLEFT"}, "text": "Peter WJ Staar, Michele Dolfi, Christoph Auer, and Costas", "orig": "Peter WJ Staar, Michele Dolfi, Christoph Auer, and Costas", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 60, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 348.661, "r_x1": 286.363, "r_y1": 348.661, "r_x2": 286.363, "r_y2": 340.964, "r_x3": 70.031, "r_y3": 340.964, "coord_origin": "TOPLEFT"}, "text": "Bekas. Corpus conversion service: A machine learning plat-", "orig": "Bekas. Corpus conversion service: A machine learning plat-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 61, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 359.62, "r_x1": 198.824, "r_y1": 359.62, "r_x2": 198.824, "r_y2": 351.923, "r_x3": 70.031, "r_y3": 351.923, "coord_origin": "TOPLEFT"}, "text": "form to ingest documents at scale.", "orig": "form to ingest documents at scale.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 62, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 206.06, "r_y0": 359.62, "r_x1": 213.529, "r_y1": 359.62, "r_x2": 213.529, "r_y2": 351.923, "r_x3": 206.06, "r_y3": 351.923, "coord_origin": "TOPLEFT"}, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 63, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 217.021, "r_y0": 359.491, "r_x1": 286.358, "r_y1": 359.491, "r_x2": 286.358, "r_y2": 351.761, "r_x3": 217.021, "r_y3": 351.761, "coord_origin": "TOPLEFT"}, "text": "Proceedings of the", "orig": "Proceedings of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 64, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 370.45, "r_x1": 143.08, "r_y1": 370.45, "r_x2": 143.08, "r_y2": 362.72, "r_x3": 70.031, "r_y3": 362.72, "coord_origin": "TOPLEFT"}, "text": "24th ACM SIGKDD", "orig": "24th ACM SIGKDD", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 65, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 143.078, "r_y0": 370.579, "r_x1": 145.32, "r_y1": 370.579, "r_x2": 145.32, "r_y2": 362.882, "r_x3": 143.078, "r_y3": 362.882, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 66, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 148.108, "r_y0": 370.579, "r_x1": 286.361, "r_y1": 370.579, "r_x2": 286.361, "r_y2": 362.882, "r_x3": 148.108, "r_y3": 362.882, "coord_origin": "TOPLEFT"}, "text": "KDD '18, pages 774-782, New York,", "orig": "KDD '18, pages 774-782, New York,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 67, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 381.538, "r_x1": 161.157, "r_y1": 381.538, "r_x2": 161.157, "r_y2": 373.841, "r_x3": 70.031, "r_y3": 373.841, "coord_origin": "TOPLEFT"}, "text": "NY, USA, 2018. ACM. 1", "orig": "NY, USA, 2018. ACM. 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[30] Peter WJ Staar, Michele Dolfi, Christoph Auer, and Costas Bekas. Corpus conversion service: A machine learning platform to ingest documents at scale. In Proceedings of the 24th ACM SIGKDD , KDD '18, pages 774-782, New York, NY, USA, 2018. ACM. 1"}, {"label": "list_item", "id": 1, "page_no": 9, "cluster": {"id": 1, "label": "list_item", "bbox": {"l": 50.112, "t": 385.165, "r": 286.364, "b": 458.615, "coord_origin": "TOPLEFT"}, "confidence": 0.8832162618637085, "cells": [{"index": 68, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 392.862, "r_x1": 65.05, "r_y1": 392.862, "r_x2": 65.05, "r_y2": 385.165, "r_x3": 50.112, "r_y3": 385.165, "coord_origin": "TOPLEFT"}, "text": "[31]", "orig": "[31]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 69, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 392.862, "r_x1": 286.359, "r_y1": 392.862, "r_x2": 286.359, "r_y2": 385.165, "r_x3": 70.035, "r_y3": 385.165, "coord_origin": "TOPLEFT"}, "text": "Ashish Vaswani, Noam Shazeer, Niki Parmar, Jakob Uszko-", "orig": "Ashish Vaswani, Noam Shazeer, Niki Parmar, Jakob Uszko-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 70, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 403.821, "r_x1": 84.225, "r_y1": 403.821, "r_x2": 84.225, "r_y2": 396.124, "r_x3": 70.031, "r_y3": 396.124, "coord_origin": "TOPLEFT"}, "text": "reit,", "orig": "reit,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 71, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 87.489, "r_y0": 403.821, "r_x1": 286.363, "r_y1": 403.821, "r_x2": 286.363, "r_y2": 396.124, "r_x3": 87.489, "r_y3": 396.124, "coord_origin": "TOPLEFT"}, "text": "Llion Jones, Aidan N Gomez, \u0141 ukasz Kaiser, and Il-", "orig": "Llion Jones, Aidan N Gomez, \u0141 ukasz Kaiser, and Il-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 72, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 414.78, "r_x1": 78.997, "r_y1": 414.78, "r_x2": 78.997, "r_y2": 407.083, "r_x3": 70.031, "r_y3": 407.083, "coord_origin": "TOPLEFT"}, "text": "lia", "orig": "lia", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 73, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 82.871, "r_y0": 414.78, "r_x1": 125.47, "r_y1": 414.78, "r_x2": 125.47, "r_y2": 407.083, "r_x3": 82.871, "r_y3": 407.083, "coord_origin": "TOPLEFT"}, "text": "Polosukhin.", "orig": "Polosukhin.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 74, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 133.908, "r_y0": 414.78, "r_x1": 167.783, "r_y1": 414.78, "r_x2": 167.783, "r_y2": 407.083, "r_x3": 133.908, "r_y3": 407.083, "coord_origin": "TOPLEFT"}, "text": "Attention", "orig": "Attention", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 75, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 171.656, "r_y0": 414.78, "r_x1": 177.637, "r_y1": 414.78, "r_x2": 177.637, "r_y2": 407.083, "r_x3": 171.656, "r_y3": 407.083, "coord_origin": "TOPLEFT"}, "text": "is", "orig": "is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 76, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 181.51, "r_y0": 414.78, "r_x1": 190.477, "r_y1": 414.78, "r_x2": 190.477, "r_y2": 407.083, "r_x3": 181.51, "r_y3": 407.083, "coord_origin": "TOPLEFT"}, "text": "all", "orig": "all", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 77, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 194.341, "r_y0": 414.78, "r_x1": 230.834, "r_y1": 414.78, "r_x2": 230.834, "r_y2": 407.083, "r_x3": 194.341, "r_y3": 407.083, "coord_origin": "TOPLEFT"}, "text": "you need.", "orig": "you need.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 78, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 239.272, "r_y0": 414.78, "r_x1": 246.741, "r_y1": 414.78, "r_x2": 246.741, "r_y2": 407.083, "r_x3": 239.272, "r_y3": 407.083, "coord_origin": "TOPLEFT"}, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 79, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 250.614, "r_y0": 414.78, "r_x1": 255.842, "r_y1": 414.78, "r_x2": 255.842, "r_y2": 407.083, "r_x3": 250.614, "r_y3": 407.083, "coord_origin": "TOPLEFT"}, "text": "I.", "orig": "I.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 80, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 259.715, "r_y0": 414.78, "r_x1": 286.363, "r_y1": 414.78, "r_x2": 286.363, "r_y2": 407.083, "r_x3": 259.715, "r_y3": 407.083, "coord_origin": "TOPLEFT"}, "text": "Guyon,", "orig": "Guyon,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 81, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 425.739, "r_x1": 286.363, "r_y1": 425.739, "r_x2": 286.363, "r_y2": 418.042, "r_x3": 70.031, "r_y3": 418.042, "coord_origin": "TOPLEFT"}, "text": "U. V. Luxburg, S. Bengio, H. Wallach, R. Fergus, S. Vish-", "orig": "U. V. Luxburg, S. Bengio, H. Wallach, R. Fergus, S. Vish-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 82, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 436.697, "r_x1": 196.762, "r_y1": 436.697, "r_x2": 196.762, "r_y2": 429.0, "r_x3": 70.031, "r_y3": 429.0, "coord_origin": "TOPLEFT"}, "text": "wanathan, and R. Garnett, editors,", "orig": "wanathan, and R. Garnett, editors,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 83, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 200.202, "r_y0": 436.568, "r_x1": 286.36, "r_y1": 436.568, "r_x2": 286.36, "r_y2": 428.838, "r_x3": 200.202, "r_y3": 428.838, "coord_origin": "TOPLEFT"}, "text": "Advances in Neural In-", "orig": "Advances in Neural In-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 84, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 447.527, "r_x1": 189.194, "r_y1": 447.527, "r_x2": 189.194, "r_y2": 439.797, "r_x3": 70.031, "r_y3": 439.797, "coord_origin": "TOPLEFT"}, "text": "formation Processing Systems 30", "orig": "formation Processing Systems 30", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 85, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 189.195, "r_y0": 447.656, "r_x1": 191.437, "r_y1": 447.656, "r_x2": 191.437, "r_y2": 439.959, "r_x3": 189.195, "r_y3": 439.959, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 86, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 193.795, "r_y0": 447.656, "r_x1": 286.364, "r_y1": 447.656, "r_x2": 286.364, "r_y2": 439.959, "r_x3": 193.795, "r_y3": 439.959, "coord_origin": "TOPLEFT"}, "text": "pages 5998-6008. Curran", "orig": "pages 5998-6008. Curran", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 87, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 458.615, "r_x1": 158.924, "r_y1": 458.615, "r_x2": 158.924, "r_y2": 450.918, "r_x3": 70.031, "r_y3": 450.918, "coord_origin": "TOPLEFT"}, "text": "Associates, Inc., 2017. 5", "orig": "Associates, Inc., 2017. 5", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[31] Ashish Vaswani, Noam Shazeer, Niki Parmar, Jakob Uszkoreit, Llion Jones, Aidan N Gomez, \u0141 ukasz Kaiser, and Illia Polosukhin. Attention is all you need. In I. Guyon, U. V. Luxburg, S. Bengio, H. Wallach, R. Fergus, S. Vishwanathan, and R. Garnett, editors, Advances in Neural Information Processing Systems 30 , pages 5998-6008. Curran Associates, Inc., 2017. 5"}, {"label": "list_item", "id": 6, "page_no": 9, "cluster": {"id": 6, "label": "list_item", "bbox": {"l": 50.112, "t": 462.242, "r": 286.363, "b": 502.816, "coord_origin": "TOPLEFT"}, "confidence": 0.8431925177574158, "cells": [{"index": 88, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 469.939, "r_x1": 65.05, "r_y1": 469.939, "r_x2": 65.05, "r_y2": 462.242, "r_x3": 50.112, "r_y3": 462.242, "coord_origin": "TOPLEFT"}, "text": "[32]", "orig": "[32]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 89, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 469.939, "r_x1": 88.963, "r_y1": 469.939, "r_x2": 88.963, "r_y2": 462.242, "r_x3": 70.035, "r_y3": 462.242, "coord_origin": "TOPLEFT"}, "text": "Oriol", "orig": "Oriol", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 90, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 92.81, "r_y0": 469.939, "r_x1": 122.274, "r_y1": 469.939, "r_x2": 122.274, "r_y2": 462.242, "r_x3": 92.81, "r_y3": 462.242, "coord_origin": "TOPLEFT"}, "text": "Vinyals,", "orig": "Vinyals,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 91, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 126.524, "r_y0": 469.939, "r_x1": 194.695, "r_y1": 469.939, "r_x2": 194.695, "r_y2": 462.242, "r_x3": 126.524, "r_y3": 462.242, "coord_origin": "TOPLEFT"}, "text": "Alexander Toshev,", "orig": "Alexander Toshev,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 92, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 198.954, "r_y0": 469.939, "r_x1": 286.359, "r_y1": 469.939, "r_x2": 286.359, "r_y2": 462.242, "r_x3": 198.954, "r_y3": 462.242, "coord_origin": "TOPLEFT"}, "text": "Samy Bengio, and Du-", "orig": "Samy Bengio, and Du-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 93, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 480.898, "r_x1": 116.28, "r_y1": 480.898, "r_x2": 116.28, "r_y2": 473.201, "r_x3": 70.031, "r_y3": 473.201, "coord_origin": "TOPLEFT"}, "text": "mitru Erhan.", "orig": "mitru Erhan.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 94, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 122.484, "r_y0": 480.898, "r_x1": 175.924, "r_y1": 480.898, "r_x2": 175.924, "r_y2": 473.201, "r_x3": 122.484, "r_y3": 473.201, "coord_origin": "TOPLEFT"}, "text": "Show and tell:", "orig": "Show and tell:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 95, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 180.56, "r_y0": 480.898, "r_x1": 286.363, "r_y1": 480.898, "r_x2": 286.363, "r_y2": 473.201, "r_x3": 180.56, "r_y3": 473.201, "coord_origin": "TOPLEFT"}, "text": "A neural image caption gen-", "orig": "A neural image caption gen-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 96, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 491.857, "r_x1": 103.305, "r_y1": 491.857, "r_x2": 103.305, "r_y2": 484.16, "r_x3": 70.031, "r_y3": 484.16, "coord_origin": "TOPLEFT"}, "text": "erator. In", "orig": "erator. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 97, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 105.516, "r_y0": 491.728, "r_x1": 286.359, "r_y1": 491.728, "r_x2": 286.359, "r_y2": 483.998, "r_x3": 105.516, "r_y3": 483.998, "coord_origin": "TOPLEFT"}, "text": "Proceedings of the IEEE Conference on Computer", "orig": "Proceedings of the IEEE Conference on Computer", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 98, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 502.687, "r_x1": 212.516, "r_y1": 502.687, "r_x2": 212.516, "r_y2": 494.957, "r_x3": 70.031, "r_y3": 494.957, "coord_origin": "TOPLEFT"}, "text": "Vision and Pattern Recognition (CVPR)", "orig": "Vision and Pattern Recognition (CVPR)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 99, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 212.514, "r_y0": 502.816, "r_x1": 263.56, "r_y1": 502.816, "r_x2": 263.56, "r_y2": 495.119, "r_x3": 212.514, "r_y3": 495.119, "coord_origin": "TOPLEFT"}, "text": ", June 2015. 2", "orig": ", June 2015. 2", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[32] Oriol Vinyals, Alexander Toshev, Samy Bengio, and Dumitru Erhan. Show and tell: A neural image caption generator. In Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition (CVPR) , June 2015. 2"}, {"label": "list_item", "id": 7, "page_no": 9, "cluster": {"id": 7, "label": "list_item", "bbox": {"l": 50.112, "t": 506.443, "r": 286.363, "b": 547.016, "coord_origin": "TOPLEFT"}, "confidence": 0.8405635952949524, "cells": [{"index": 100, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 514.14, "r_x1": 65.05, "r_y1": 514.14, "r_x2": 65.05, "r_y2": 506.443, "r_x3": 50.112, "r_y3": 506.443, "coord_origin": "TOPLEFT"}, "text": "[33]", "orig": "[33]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 101, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 514.14, "r_x1": 247.373, "r_y1": 514.14, "r_x2": 247.373, "r_y2": 506.443, "r_x3": 70.035, "r_y3": 506.443, "coord_origin": "TOPLEFT"}, "text": "Wenyuan Xue, Qingyong Li, and Dacheng Tao.", "orig": "Wenyuan Xue, Qingyong Li, and Dacheng Tao.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 102, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 253.972, "r_y0": 514.14, "r_x1": 286.359, "r_y1": 514.14, "r_x2": 286.359, "r_y2": 506.443, "r_x3": 253.972, "r_y3": 506.443, "coord_origin": "TOPLEFT"}, "text": "Res2tim:", "orig": "Res2tim:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 103, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 525.0989999999999, "r_x1": 253.125, "r_y1": 525.0989999999999, "r_x2": 253.125, "r_y2": 517.402, "r_x3": 70.031, "r_y3": 517.402, "coord_origin": "TOPLEFT"}, "text": "reconstruct syntactic structures from table images.", "orig": "reconstruct syntactic structures from table images.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 104, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 258.155, "r_y0": 525.0989999999999, "r_x1": 265.624, "r_y1": 525.0989999999999, "r_x2": 265.624, "r_y2": 517.402, "r_x3": 258.155, "r_y3": 517.402, "coord_origin": "TOPLEFT"}, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 105, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 268.429, "r_y0": 524.97, "r_x1": 286.362, "r_y1": 524.97, "r_x2": 286.362, "r_y2": 517.24, "r_x3": 268.429, "r_y3": 517.24, "coord_origin": "TOPLEFT"}, "text": "2019", "orig": "2019", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 106, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 535.929, "r_x1": 286.363, "r_y1": 535.929, "r_x2": 286.363, "r_y2": 528.1990000000001, "r_x3": 70.031, "r_y3": 528.1990000000001, "coord_origin": "TOPLEFT"}, "text": "International Conference on Document Analysis and Recog-", "orig": "International Conference on Document Analysis and Recog-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 107, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 546.887, "r_x1": 125.255, "r_y1": 546.887, "r_x2": 125.255, "r_y2": 539.157, "r_x3": 70.031, "r_y3": 539.157, "coord_origin": "TOPLEFT"}, "text": "nition (ICDAR)", "orig": "nition (ICDAR)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 108, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 125.254, "r_y0": 547.016, "r_x1": 240.051, "r_y1": 547.016, "r_x2": 240.051, "r_y2": 539.319, "r_x3": 125.254, "r_y3": 539.319, "coord_origin": "TOPLEFT"}, "text": ", pages 749-755. IEEE, 2019. 3", "orig": ", pages 749-755. IEEE, 2019. 3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[33] Wenyuan Xue, Qingyong Li, and Dacheng Tao. Res2tim: reconstruct syntactic structures from table images. In 2019 International Conference on Document Analysis and Recognition (ICDAR) , pages 749-755. IEEE, 2019. 3"}, {"label": "list_item", "id": 11, "page_no": 9, "cluster": {"id": 11, "label": "list_item", "bbox": {"l": 50.112, "t": 550.643, "r": 286.363, "b": 591.217, "coord_origin": "TOPLEFT"}, "confidence": 0.8241521716117859, "cells": [{"index": 109, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 558.34, "r_x1": 65.05, "r_y1": 558.34, "r_x2": 65.05, "r_y2": 550.643, "r_x3": 50.112, "r_y3": 550.643, "coord_origin": "TOPLEFT"}, "text": "[34]", "orig": "[34]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 110, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 558.34, "r_x1": 125.008, "r_y1": 558.34, "r_x2": 125.008, "r_y2": 550.643, "r_x3": 70.035, "r_y3": 550.643, "coord_origin": "TOPLEFT"}, "text": "Wenyuan Xue,", "orig": "Wenyuan Xue,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 111, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 129.823, "r_y0": 558.34, "r_x1": 181.676, "r_y1": 558.34, "r_x2": 181.676, "r_y2": 550.643, "r_x3": 129.823, "r_y3": 550.643, "coord_origin": "TOPLEFT"}, "text": "Baosheng Yu,", "orig": "Baosheng Yu,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 112, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 186.491, "r_y0": 558.34, "r_x1": 286.359, "r_y1": 558.34, "r_x2": 286.359, "r_y2": 550.643, "r_x3": 186.491, "r_y3": 550.643, "coord_origin": "TOPLEFT"}, "text": "Wen Wang, Dacheng Tao,", "orig": "Wen Wang, Dacheng Tao,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 113, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 569.299, "r_x1": 137.082, "r_y1": 569.299, "r_x2": 137.082, "r_y2": 561.602, "r_x3": 70.031, "r_y3": 561.602, "coord_origin": "TOPLEFT"}, "text": "and Qingyong Li.", "orig": "and Qingyong Li.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 114, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 145.985, "r_y0": 569.299, "r_x1": 172.382, "r_y1": 569.299, "r_x2": 172.382, "r_y2": 561.602, "r_x3": 145.985, "r_y3": 561.602, "coord_origin": "TOPLEFT"}, "text": "Tgrnet:", "orig": "Tgrnet:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 115, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 178.704, "r_y0": 569.299, "r_x1": 206.625, "r_y1": 569.299, "r_x2": 206.625, "r_y2": 561.602, "r_x3": 178.704, "r_y3": 561.602, "coord_origin": "TOPLEFT"}, "text": "A table", "orig": "A table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 116, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 210.633, "r_y0": 569.299, "r_x1": 286.363, "r_y1": 569.299, "r_x2": 286.363, "r_y2": 561.602, "r_x3": 210.633, "r_y3": 561.602, "coord_origin": "TOPLEFT"}, "text": "graph reconstruction", "orig": "graph reconstruction", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 117, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 580.258, "r_x1": 99.324, "r_y1": 580.258, "r_x2": 99.324, "r_y2": 572.561, "r_x3": 70.031, "r_y3": 572.561, "coord_origin": "TOPLEFT"}, "text": "network", "orig": "network", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 118, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 104.157, "r_y0": 580.258, "r_x1": 114.612, "r_y1": 580.258, "r_x2": 114.612, "r_y2": 572.561, "r_x3": 104.157, "r_y3": 572.561, "coord_origin": "TOPLEFT"}, "text": "for", "orig": "for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 119, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 119.454, "r_y0": 580.258, "r_x1": 136.884, "r_y1": 580.258, "r_x2": 136.884, "r_y2": 572.561, "r_x3": 119.454, "r_y3": 572.561, "coord_origin": "TOPLEFT"}, "text": "table", "orig": "table", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 120, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 141.717, "r_y0": 580.258, "r_x1": 173.091, "r_y1": 580.258, "r_x2": 173.091, "r_y2": 572.561, "r_x3": 141.717, "r_y3": 572.561, "coord_origin": "TOPLEFT"}, "text": "structure", "orig": "structure", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 121, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 177.933, "r_y0": 580.258, "r_x1": 221.007, "r_y1": 580.258, "r_x2": 221.007, "r_y2": 572.561, "r_x3": 177.933, "r_y3": 572.561, "coord_origin": "TOPLEFT"}, "text": "recognition.", "orig": "recognition.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 122, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 232.543, "r_y0": 580.129, "r_x1": 252.466, "r_y1": 580.129, "r_x2": 252.466, "r_y2": 572.399, "r_x3": 232.543, "r_y3": 572.399, "coord_origin": "TOPLEFT"}, "text": "arXiv", "orig": "arXiv", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 123, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 257.299, "r_y0": 580.129, "r_x1": 286.359, "r_y1": 580.129, "r_x2": 286.359, "r_y2": 572.399, "r_x3": 257.299, "r_y3": 572.399, "coord_origin": "TOPLEFT"}, "text": "preprint", "orig": "preprint", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 124, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 591.088, "r_x1": 135.531, "r_y1": 591.088, "r_x2": 135.531, "r_y2": 583.358, "r_x3": 70.031, "r_y3": 583.358, "coord_origin": "TOPLEFT"}, "text": "arXiv:2106.10598", "orig": "arXiv:2106.10598", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 125, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 135.53, "r_y0": 591.217, "r_x1": 167.899, "r_y1": 591.217, "r_x2": 167.899, "r_y2": 583.52, "r_x3": 135.53, "r_y3": 583.52, "coord_origin": "TOPLEFT"}, "text": ", 2021. 3", "orig": ", 2021. 3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[34] Wenyuan Xue, Baosheng Yu, Wen Wang, Dacheng Tao, and Qingyong Li. Tgrnet: A table graph reconstruction network for table structure recognition. arXiv preprint arXiv:2106.10598 , 2021. 3"}, {"label": "list_item", "id": 10, "page_no": 9, "cluster": {"id": 10, "label": "list_item", "bbox": {"l": 50.112, "t": 594.844, "r": 286.363, "b": 635.418, "coord_origin": "TOPLEFT"}, "confidence": 0.8360886573791504, "cells": [{"index": 126, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 602.5409999999999, "r_x1": 65.05, "r_y1": 602.5409999999999, "r_x2": 65.05, "r_y2": 594.844, "r_x3": 50.112, "r_y3": 594.844, "coord_origin": "TOPLEFT"}, "text": "[35]", "orig": "[35]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 127, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 602.5409999999999, "r_x1": 286.359, "r_y1": 602.5409999999999, "r_x2": 286.359, "r_y2": 594.844, "r_x3": 70.035, "r_y3": 594.844, "coord_origin": "TOPLEFT"}, "text": "Quanzeng You, Hailin Jin, Zhaowen Wang, Chen Fang, and", "orig": "Quanzeng You, Hailin Jin, Zhaowen Wang, Chen Fang, and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 128, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 613.5, "r_x1": 109.107, "r_y1": 613.5, "r_x2": 109.107, "r_y2": 605.803, "r_x3": 70.031, "r_y3": 605.803, "coord_origin": "TOPLEFT"}, "text": "Jiebo Luo.", "orig": "Jiebo Luo.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 129, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 116.226, "r_y0": 613.5, "r_x1": 271.766, "r_y1": 613.5, "r_x2": 271.766, "r_y2": 605.803, "r_x3": 116.226, "r_y3": 605.803, "coord_origin": "TOPLEFT"}, "text": "Image captioning with semantic attention.", "orig": "Image captioning with semantic attention.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 130, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 278.894, "r_y0": 613.5, "r_x1": 286.363, "r_y1": 613.5, "r_x2": 286.363, "r_y2": 605.803, "r_x3": 278.894, "r_y3": 605.803, "coord_origin": "TOPLEFT"}, "text": "In", "orig": "In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 131, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 624.33, "r_x1": 286.363, "r_y1": 624.33, "r_x2": 286.363, "r_y2": 616.6, "r_x3": 70.031, "r_y3": 616.6, "coord_origin": "TOPLEFT"}, "text": "Proceedings of the IEEE conference on computer vision and", "orig": "Proceedings of the IEEE conference on computer vision and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 132, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 635.289, "r_x1": 139.099, "r_y1": 635.289, "r_x2": 139.099, "r_y2": 627.559, "r_x3": 70.031, "r_y3": 627.559, "coord_origin": "TOPLEFT"}, "text": "pattern recognition", "orig": "pattern recognition", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 133, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 139.098, "r_y0": 635.418, "r_x1": 238.957, "r_y1": 635.418, "r_x2": 238.957, "r_y2": 627.721, "r_x3": 139.098, "r_y3": 627.721, "coord_origin": "TOPLEFT"}, "text": ", pages 4651-4659, 2016. 4", "orig": ", pages 4651-4659, 2016. 4", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[35] Quanzeng You, Hailin Jin, Zhaowen Wang, Chen Fang, and Jiebo Luo. Image captioning with semantic attention. In Proceedings of the IEEE conference on computer vision and pattern recognition , pages 4651-4659, 2016. 4"}, {"label": "list_item", "id": 12, "page_no": 9, "cluster": {"id": 12, "label": "list_item", "bbox": {"l": 50.112, "t": 639.045, "r": 286.363, "b": 690.577, "coord_origin": "TOPLEFT"}, "confidence": 0.8079474568367004, "cells": [{"index": 134, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 646.742, "r_x1": 65.05, "r_y1": 646.742, "r_x2": 65.05, "r_y2": 639.045, "r_x3": 50.112, "r_y3": 639.045, "coord_origin": "TOPLEFT"}, "text": "[36]", "orig": "[36]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 135, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 646.742, "r_x1": 286.359, "r_y1": 646.742, "r_x2": 286.359, "r_y2": 639.045, "r_x3": 70.035, "r_y3": 639.045, "coord_origin": "TOPLEFT"}, "text": "Xinyi Zheng, Doug Burdick, Lucian Popa, Peter Zhong, and", "orig": "Xinyi Zheng, Doug Burdick, Lucian Popa, Peter Zhong, and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 136, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 657.7, "r_x1": 286.363, "r_y1": 657.7, "r_x2": 286.363, "r_y2": 650.0029999999999, "r_x3": 70.031, "r_y3": 650.0029999999999, "coord_origin": "TOPLEFT"}, "text": "Nancy Xin Ru Wang. Global table extractor (gte): A frame-", "orig": "Nancy Xin Ru Wang. Global table extractor (gte): A frame-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 137, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 668.659, "r_x1": 286.363, "r_y1": 668.659, "r_x2": 286.363, "r_y2": 660.962, "r_x3": 70.031, "r_y3": 660.962, "coord_origin": "TOPLEFT"}, "text": "work for joint table identification and cell structure recogni-", "orig": "work for joint table identification and cell structure recogni-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 138, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 679.6179999999999, "r_x1": 158.458, "r_y1": 679.6179999999999, "r_x2": 158.458, "r_y2": 671.921, "r_x3": 70.031, "r_y3": 671.921, "coord_origin": "TOPLEFT"}, "text": "tion using visual context.", "orig": "tion using visual context.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 139, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.528, "r_y0": 679.489, "r_x1": 286.362, "r_y1": 679.489, "r_x2": 286.362, "r_y2": 671.759, "r_x3": 160.528, "r_y3": 671.759, "coord_origin": "TOPLEFT"}, "text": "Winter Conference for Applications", "orig": "Winter Conference for Applications", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 140, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 690.448, "r_x1": 171.423, "r_y1": 690.448, "r_x2": 171.423, "r_y2": 682.718, "r_x3": 70.031, "r_y3": 682.718, "coord_origin": "TOPLEFT"}, "text": "in Computer Vision (WACV)", "orig": "in Computer Vision (WACV)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 141, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 171.422, "r_y0": 690.577, "r_x1": 212.757, "r_y1": 690.577, "r_x2": 212.757, "r_y2": 682.88, "r_x3": 171.422, "r_y3": 682.88, "coord_origin": "TOPLEFT"}, "text": ", 2021. 2, 3", "orig": ", 2021. 2, 3", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[36] Xinyi Zheng, Doug Burdick, Lucian Popa, Peter Zhong, and Nancy Xin Ru Wang. Global table extractor (gte): A framework for joint table identification and cell structure recognition using visual context. Winter Conference for Applications in Computer Vision (WACV) , 2021. 2, 3"}, {"label": "list_item", "id": 8, "page_no": 9, "cluster": {"id": 8, "label": "list_item", "bbox": {"l": 50.112, "t": 694.204, "r": 286.363, "b": 712.86, "coord_origin": "TOPLEFT"}, "confidence": 0.8385783433914185, "cells": [{"index": 142, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 701.901, "r_x1": 65.05, "r_y1": 701.901, "r_x2": 65.05, "r_y2": 694.204, "r_x3": 50.112, "r_y3": 694.204, "coord_origin": "TOPLEFT"}, "text": "[37]", "orig": "[37]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 143, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.035, "r_y0": 701.901, "r_x1": 80.992, "r_y1": 701.901, "r_x2": 80.992, "r_y2": 694.204, "r_x3": 70.035, "r_y3": 694.204, "coord_origin": "TOPLEFT"}, "text": "Xu", "orig": "Xu", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 144, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 89.062, "r_y0": 701.901, "r_x1": 114.715, "r_y1": 701.901, "r_x2": 114.715, "r_y2": 694.204, "r_x3": 89.062, "r_y3": 694.204, "coord_origin": "TOPLEFT"}, "text": "Zhong,", "orig": "Zhong,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 145, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 124.246, "r_y0": 701.901, "r_x1": 149.146, "r_y1": 701.901, "r_x2": 149.146, "r_y2": 694.204, "r_x3": 124.246, "r_y3": 694.204, "coord_origin": "TOPLEFT"}, "text": "Elaheh", "orig": "Elaheh", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 146, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 157.225, "r_y0": 701.901, "r_x1": 209.373, "r_y1": 701.901, "r_x2": 209.373, "r_y2": 694.204, "r_x3": 157.225, "r_y3": 694.204, "coord_origin": "TOPLEFT"}, "text": "ShafieiBavani,", "orig": "ShafieiBavani,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 147, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 218.904, "r_y0": 701.901, "r_x1": 231.852, "r_y1": 701.901, "r_x2": 231.852, "r_y2": 694.204, "r_x3": 218.904, "r_y3": 694.204, "coord_origin": "TOPLEFT"}, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 148, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 239.931, "r_y0": 701.901, "r_x1": 269.323, "r_y1": 701.901, "r_x2": 269.323, "r_y2": 694.204, "r_x3": 239.931, "r_y3": 694.204, "coord_origin": "TOPLEFT"}, "text": "Antonio", "orig": "Antonio", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 149, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 277.392, "r_y0": 701.901, "r_x1": 286.359, "r_y1": 701.901, "r_x2": 286.359, "r_y2": 694.204, "r_x3": 277.392, "r_y3": 694.204, "coord_origin": "TOPLEFT"}, "text": "Ji-", "orig": "Ji-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 150, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.031, "r_y0": 712.86, "r_x1": 116.719, "r_y1": 712.86, "r_x2": 116.719, "r_y2": 705.163, "r_x3": 70.031, "r_y3": 705.163, "coord_origin": "TOPLEFT"}, "text": "meno Yepes.", "orig": "meno Yepes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 151, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 122.413, "r_y0": 712.86, "r_x1": 235.013, "r_y1": 712.86, "r_x2": 235.013, "r_y2": 705.163, "r_x3": 122.413, "r_y3": 705.163, "coord_origin": "TOPLEFT"}, "text": "Image-based table recognition:", "orig": "Image-based table recognition:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 152, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 239.335, "r_y0": 712.86, "r_x1": 286.363, "r_y1": 712.86, "r_x2": 286.363, "r_y2": 705.163, "r_x3": 239.335, "r_y3": 705.163, "coord_origin": "TOPLEFT"}, "text": "Data, model,", "orig": "Data, model,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[37] Xu Zhong, Elaheh ShafieiBavani, and Antonio Jimeno Yepes. Image-based table recognition: Data, model,"}, {"label": "list_item", "id": 14, "page_no": 9, "cluster": {"id": 14, "label": "list_item", "bbox": {"l": 328.781, "t": 76.12599999999998, "r": 545.115, "b": 116.69899999999996, "coord_origin": "TOPLEFT"}, "confidence": 0.7556979060173035, "cells": [{"index": 153, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 83.82299999999998, "r_x1": 383.646, "r_y1": 83.82299999999998, "r_x2": 383.646, "r_y2": 76.12599999999998, "r_x3": 328.781, "r_y3": 76.12599999999998, "coord_origin": "TOPLEFT"}, "text": "and evaluation.", "orig": "and evaluation.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 154, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 388.56, "r_y0": 83.82299999999998, "r_x1": 545.113, "r_y1": 83.82299999999998, "r_x2": 545.113, "r_y2": 76.12599999999998, "r_x3": 388.56, "r_y3": 76.12599999999998, "coord_origin": "TOPLEFT"}, "text": "In Andrea Vedaldi, Horst Bischof, Thomas", "orig": "In Andrea Vedaldi, Horst Bischof, Thomas", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 155, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 94.78099999999995, "r_x1": 472.306, "r_y1": 94.78099999999995, "r_x2": 472.306, "r_y2": 87.08399999999995, "r_x3": 328.781, "r_y3": 87.08399999999995, "coord_origin": "TOPLEFT"}, "text": "Brox, and Jan-Michael Frahm, editors,", "orig": "Brox, and Jan-Michael Frahm, editors,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 156, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 475.885, "r_y0": 94.65200000000004, "r_x1": 545.115, "r_y1": 94.65200000000004, "r_x2": 545.115, "r_y2": 86.92200000000003, "r_x3": 475.885, "r_y3": 86.92200000000003, "coord_origin": "TOPLEFT"}, "text": "Computer Vision -", "orig": "Computer Vision -", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 157, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 105.61099999999999, "r_x1": 371.927, "r_y1": 105.61099999999999, "r_x2": 371.927, "r_y2": 97.88099999999997, "r_x3": 328.781, "r_y3": 97.88099999999997, "coord_origin": "TOPLEFT"}, "text": "ECCV 2020", "orig": "ECCV 2020", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 158, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 371.926, "r_y0": 105.74000000000001, "r_x1": 374.168, "r_y1": 105.74000000000001, "r_x2": 374.168, "r_y2": 98.043, "r_x3": 371.926, "r_y3": 98.043, "coord_origin": "TOPLEFT"}, "text": ",", "orig": ",", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 159, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 376.472, "r_y0": 105.74000000000001, "r_x1": 545.112, "r_y1": 105.74000000000001, "r_x2": 545.112, "r_y2": 98.043, "r_x3": 376.472, "r_y3": 98.043, "coord_origin": "TOPLEFT"}, "text": "pages 564-580, Cham, 2020. Springer Interna-", "orig": "pages 564-580, Cham, 2020. Springer Interna-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 160, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 116.69899999999996, "r_x1": 417.701, "r_y1": 116.69899999999996, "r_x2": 417.701, "r_y2": 109.00199999999995, "r_x3": 328.781, "r_y3": 109.00199999999995, "coord_origin": "TOPLEFT"}, "text": "tional Publishing. 2, 3, 7", "orig": "tional Publishing. 2, 3, 7", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "and evaluation. In Andrea Vedaldi, Horst Bischof, Thomas Brox, and Jan-Michael Frahm, editors, Computer Vision ECCV 2020 , pages 564-580, Cham, 2020. Springer International Publishing. 2, 3, 7"}, {"label": "list_item", "id": 9, "page_no": 9, "cluster": {"id": 9, "label": "list_item", "bbox": {"l": 308.862, "t": 120.957, "r": 545.113, "b": 161.53099999999995, "coord_origin": "TOPLEFT"}, "confidence": 0.8375797271728516, "cells": [{"index": 161, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 128.654, "r_x1": 323.8, "r_y1": 128.654, "r_x2": 323.8, "r_y2": 120.957, "r_x3": 308.862, "r_y3": 120.957, "coord_origin": "TOPLEFT"}, "text": "[38]", "orig": "[38]", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 162, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.785, "r_y0": 128.654, "r_x1": 523.15, "r_y1": 128.654, "r_x2": 523.15, "r_y2": 120.957, "r_x3": 328.785, "r_y3": 120.957, "coord_origin": "TOPLEFT"}, "text": "Xu Zhong, Jianbin Tang, and Antonio Jimeno Yepes.", "orig": "Xu Zhong, Jianbin Tang, and Antonio Jimeno Yepes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 163, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 528.171, "r_y0": 128.654, "r_x1": 545.109, "r_y1": 128.654, "r_x2": 545.109, "r_y2": 120.957, "r_x3": 528.171, "r_y3": 120.957, "coord_origin": "TOPLEFT"}, "text": "Pub-", "orig": "Pub-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 164, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 139.61300000000006, "r_x1": 545.113, "r_y1": 139.61300000000006, "r_x2": 545.113, "r_y2": 131.91600000000005, "r_x3": 328.781, "r_y3": 131.91600000000005, "coord_origin": "TOPLEFT"}, "text": "laynet: Largest dataset ever for document layout analysis. In", "orig": "laynet: Largest dataset ever for document layout analysis. In", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 165, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 150.44299999999998, "r_x1": 545.113, "r_y1": 150.44299999999998, "r_x2": 545.113, "r_y2": 142.71299999999997, "r_x3": 328.781, "r_y3": 142.71299999999997, "coord_origin": "TOPLEFT"}, "text": "2019 International Conference on Document Analysis and", "orig": "2019 International Conference on Document Analysis and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 166, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 328.781, "r_y0": 161.40200000000004, "r_x1": 406.322, "r_y1": 161.40200000000004, "r_x2": 406.322, "r_y2": 153.67200000000003, "r_x3": 328.781, "r_y3": 153.67200000000003, "coord_origin": "TOPLEFT"}, "text": "Recognition (ICDAR)", "orig": "Recognition (ICDAR)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 167, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 406.322, "r_y0": 161.53099999999995, "r_x1": 506.181, "r_y1": 161.53099999999995, "r_x2": 506.181, "r_y2": 153.83399999999995, "r_x3": 406.322, "r_y3": 153.83399999999995, "coord_origin": "TOPLEFT"}, "text": ", pages 1015-1022, 2019. 1", "orig": ", pages 1015-1022, 2019. 1", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "[38] Xu Zhong, Jianbin Tang, and Antonio Jimeno Yepes. Publaynet: Largest dataset ever for document layout analysis. In 2019 International Conference on Document Analysis and Recognition (ICDAR) , pages 1015-1022, 2019. 1"}], "headers": [{"label": "page_footer", "id": 0, "page_no": 9, "cluster": {"id": 0, "label": "page_footer", "bbox": {"l": 292.63, "t": 734.402, "r": 302.593, "b": 742.954, "coord_origin": "TOPLEFT"}, "confidence": 0.9069584012031555, "cells": [{"index": 168, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 292.63, "r_y0": 742.954, "r_x1": 302.593, "r_y1": 742.954, "r_x2": 302.593, "r_y2": 734.402, "r_x3": 292.63, "r_y3": 734.402, "coord_origin": "TOPLEFT"}, "text": "10", "orig": "10", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "10"}]}}, {"page_no": 10, "size": {"width": 612.0, "height": 792.0}, "cells": [{"index": 0, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 132.842, "r_y0": 121.32299999999998, "r_x1": 465.376, "r_y1": 121.32299999999998, "r_x2": 465.376, "r_y2": 110.57500000000005, "r_x3": 132.842, "r_y3": 110.57500000000005, "coord_origin": "TOPLEFT"}, "text": "TableFormer: Table Structure Understanding with Transformers", "orig": "TableFormer: Table Structure Understanding with Transformers", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 220.184, "r_y0": 135.48400000000004, "r_x1": 375.043, "r_y1": 135.48400000000004, "r_x2": 375.043, "r_y2": 122.42399999999998, "r_x3": 220.184, "r_y3": 122.42399999999998, "coord_origin": "TOPLEFT"}, "text": "Supplementary Material", "orig": "Supplementary Material", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 171.909, "r_x1": 175.964, "r_y1": 171.909, "r_x2": 175.964, "r_y2": 161.16099999999994, "r_x3": 50.112, "r_y3": 161.16099999999994, "coord_origin": "TOPLEFT"}, "text": "1. Details on the datasets", "orig": "1. Details on the datasets", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 190.83100000000002, "r_x1": 150.364, "r_y1": 190.83100000000002, "r_x2": 150.364, "r_y2": 180.97900000000004, "r_x3": 50.112, "r_y3": 180.97900000000004, "coord_origin": "TOPLEFT"}, "text": "1.1. Data preparation", "orig": "1.1. Data preparation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 208.74099999999999, "r_x1": 286.365, "r_y1": 208.74099999999999, "r_x2": 286.365, "r_y2": 200.18899999999996, "r_x3": 62.067, "r_y3": 200.18899999999996, "coord_origin": "TOPLEFT"}, "text": "As a first step of our data preparation process, we have", "orig": "As a first step of our data preparation process, we have", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 220.697, "r_x1": 286.365, "r_y1": 220.697, "r_x2": 286.365, "r_y2": 212.14499999999998, "r_x3": 50.112, "r_y3": 212.14499999999998, "coord_origin": "TOPLEFT"}, "text": "calculated statistics over the datasets across the following", "orig": "calculated statistics over the datasets across the following", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 232.65200000000004, "r_x1": 286.365, "r_y1": 232.65200000000004, "r_x2": 286.365, "r_y2": 224.10000000000002, "r_x3": 50.112, "r_y3": 224.10000000000002, "coord_origin": "TOPLEFT"}, "text": "dimensions: (1) table size measured in the number of rows", "orig": "dimensions: (1) table size measured in the number of rows", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 244.60699999999997, "r_x1": 286.365, "r_y1": 244.60699999999997, "r_x2": 286.365, "r_y2": 236.05499999999995, "r_x3": 50.112, "r_y3": 236.05499999999995, "coord_origin": "TOPLEFT"}, "text": "and columns, (2) complexity of the table, (3) strictness of", "orig": "and columns, (2) complexity of the table, (3) strictness of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 256.562, "r_x1": 286.365, "r_y1": 256.562, "r_x2": 286.365, "r_y2": 248.01, "r_x3": 50.112, "r_y3": 248.01, "coord_origin": "TOPLEFT"}, "text": "the provided HTML structure and (4) completeness (i.e. no", "orig": "the provided HTML structure and (4) completeness (i.e. no", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 268.51700000000005, "r_x1": 286.365, "r_y1": 268.51700000000005, "r_x2": 286.365, "r_y2": 259.96500000000003, "r_x3": 50.112, "r_y3": 259.96500000000003, "coord_origin": "TOPLEFT"}, "text": "omitted bounding boxes). Atable is considered to be simple", "orig": "omitted bounding boxes). Atable is considered to be simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 280.472, "r_x1": 286.365, "r_y1": 280.472, "r_x2": 286.365, "r_y2": 271.91999999999996, "r_x3": 50.112, "r_y3": 271.91999999999996, "coord_origin": "TOPLEFT"}, "text": "if it does not contain row spans or column spans. Addition-", "orig": "if it does not contain row spans or column spans. Addition-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 292.428, "r_x1": 286.365, "r_y1": 292.428, "r_x2": 286.365, "r_y2": 283.876, "r_x3": 50.112, "r_y3": 283.876, "coord_origin": "TOPLEFT"}, "text": "ally, a table has a strict HTMLstructure if every row has the", "orig": "ally, a table has a strict HTMLstructure if every row has the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 304.383, "r_x1": 286.365, "r_y1": 304.383, "r_x2": 286.365, "r_y2": 295.831, "r_x3": 50.112, "r_y3": 295.831, "coord_origin": "TOPLEFT"}, "text": "same number of columns after taking into account any row", "orig": "same number of columns after taking into account any row", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 316.338, "r_x1": 118.834, "r_y1": 316.338, "r_x2": 118.834, "r_y2": 307.786, "r_x3": 50.112, "r_y3": 307.786, "coord_origin": "TOPLEFT"}, "text": "or column spans.", "orig": "or column spans.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 123.307, "r_y0": 316.338, "r_x1": 286.365, "r_y1": 316.338, "r_x2": 286.365, "r_y2": 307.786, "r_x3": 123.307, "r_y3": 307.786, "coord_origin": "TOPLEFT"}, "text": "Therefore a strict HTML structure looks", "orig": "Therefore a strict HTML structure looks", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 328.293, "r_x1": 127.163, "r_y1": 328.293, "r_x2": 127.163, "r_y2": 319.741, "r_x3": 50.112, "r_y3": 319.741, "coord_origin": "TOPLEFT"}, "text": "always rectangular.", "orig": "always rectangular.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 131.257, "r_y0": 328.293, "r_x1": 286.365, "r_y1": 328.293, "r_x2": 286.365, "r_y2": 319.741, "r_x3": 131.257, "r_y3": 319.741, "coord_origin": "TOPLEFT"}, "text": "However, HTML is a lenient encoding", "orig": "However, HTML is a lenient encoding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 340.248, "r_x1": 95.163, "r_y1": 340.248, "r_x2": 95.163, "r_y2": 331.696, "r_x3": 50.112, "r_y3": 331.696, "coord_origin": "TOPLEFT"}, "text": "format, i.e.", "orig": "format, i.e.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 101.459, "r_y0": 340.248, "r_x1": 286.365, "r_y1": 340.248, "r_x2": 286.365, "r_y2": 331.696, "r_x3": 101.459, "r_y3": 331.696, "coord_origin": "TOPLEFT"}, "text": "tables with rows of different sizes might still", "orig": "tables with rows of different sizes might still", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 19, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 352.204, "r_x1": 257.942, "r_y1": 352.204, "r_x2": 257.942, "r_y2": 343.652, "r_x3": 50.112, "r_y3": 343.652, "coord_origin": "TOPLEFT"}, "text": "be regarded as correct due to implicit display rules.", "orig": "be regarded as correct due to implicit display rules.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 20, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 262.574, "r_y0": 352.204, "r_x1": 286.365, "r_y1": 352.204, "r_x2": 286.365, "r_y2": 343.652, "r_x3": 262.574, "r_y3": 343.652, "coord_origin": "TOPLEFT"}, "text": "These", "orig": "These", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 21, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 364.159, "r_x1": 286.365, "r_y1": 364.159, "r_x2": 286.365, "r_y2": 355.607, "r_x3": 50.112, "r_y3": 355.607, "coord_origin": "TOPLEFT"}, "text": "implicit rules leave room for ambiguity, which we want to", "orig": "implicit rules leave room for ambiguity, which we want to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 22, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 376.114, "r_x1": 286.365, "r_y1": 376.114, "r_x2": 286.365, "r_y2": 367.562, "r_x3": 50.112, "r_y3": 367.562, "coord_origin": "TOPLEFT"}, "text": "avoid. As such, we prefer to have 'strict' tables, i.e. tables", "orig": "avoid. As such, we prefer to have 'strict' tables, i.e. tables", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 23, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 388.069, "r_x1": 230.804, "r_y1": 388.069, "r_x2": 230.804, "r_y2": 379.517, "r_x3": 50.112, "r_y3": 379.517, "coord_origin": "TOPLEFT"}, "text": "where every row has exactly the same length.", "orig": "where every row has exactly the same length.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 24, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 400.226, "r_x1": 236.243, "r_y1": 400.226, "r_x2": 236.243, "r_y2": 391.674, "r_x3": 62.067, "r_y3": 391.674, "coord_origin": "TOPLEFT"}, "text": "We have developed a technique that tries", "orig": "We have developed a technique that tries", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 25, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 240.726, "r_y0": 400.226, "r_x1": 248.477, "r_y1": 400.226, "r_x2": 248.477, "r_y2": 391.674, "r_x3": 240.726, "r_y3": 391.674, "coord_origin": "TOPLEFT"}, "text": "to", "orig": "to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 26, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 252.96, "r_y0": 400.226, "r_x1": 277.458, "r_y1": 400.226, "r_x2": 277.458, "r_y2": 391.674, "r_x3": 252.96, "r_y3": 391.674, "coord_origin": "TOPLEFT"}, "text": "derive", "orig": "derive", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 27, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 281.942, "r_y0": 400.226, "r_x1": 286.365, "r_y1": 400.226, "r_x2": 286.365, "r_y2": 391.674, "r_x3": 281.942, "r_y3": 391.674, "coord_origin": "TOPLEFT"}, "text": "a", "orig": "a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 28, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 412.181, "r_x1": 223.571, "r_y1": 412.181, "r_x2": 223.571, "r_y2": 403.629, "r_x3": 50.112, "r_y3": 403.629, "coord_origin": "TOPLEFT"}, "text": "missing bounding box out of its neighbors.", "orig": "missing bounding box out of its neighbors.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 29, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 228.004, "r_y0": 412.181, "r_x1": 286.365, "r_y1": 412.181, "r_x2": 286.365, "r_y2": 403.629, "r_x3": 228.004, "r_y3": 403.629, "coord_origin": "TOPLEFT"}, "text": "As a first step,", "orig": "As a first step,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 30, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 424.136, "r_x1": 286.365, "r_y1": 424.136, "r_x2": 286.365, "r_y2": 415.584, "r_x3": 50.112, "r_y3": 415.584, "coord_origin": "TOPLEFT"}, "text": "we use the annotation data to generate the most fine-grained", "orig": "we use the annotation data to generate the most fine-grained", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 436.092, "r_x1": 189.519, "r_y1": 436.092, "r_x2": 189.519, "r_y2": 427.54, "r_x3": 50.112, "r_y3": 427.54, "coord_origin": "TOPLEFT"}, "text": "grid that covers the table structure.", "orig": "grid that covers the table structure.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 193.414, "r_y0": 436.092, "r_x1": 286.365, "r_y1": 436.092, "r_x2": 286.365, "r_y2": 427.54, "r_x3": 193.414, "r_y3": 427.54, "coord_origin": "TOPLEFT"}, "text": "In case of strict HTML", "orig": "In case of strict HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 448.047, "r_x1": 286.365, "r_y1": 448.047, "r_x2": 286.365, "r_y2": 439.495, "r_x3": 50.112, "r_y3": 439.495, "coord_origin": "TOPLEFT"}, "text": "tables, all grid squares are associated with some table cell", "orig": "tables, all grid squares are associated with some table cell", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 460.002, "r_x1": 286.365, "r_y1": 460.002, "r_x2": 286.365, "r_y2": 451.45, "r_x3": 50.112, "r_y3": 451.45, "coord_origin": "TOPLEFT"}, "text": "and in the presence of table spans a cell extends across mul-", "orig": "and in the presence of table spans a cell extends across mul-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 471.957, "r_x1": 286.365, "r_y1": 471.957, "r_x2": 286.365, "r_y2": 463.405, "r_x3": 50.112, "r_y3": 463.405, "coord_origin": "TOPLEFT"}, "text": "tiple grid squares. When enough bounding boxes are known", "orig": "tiple grid squares. When enough bounding boxes are known", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 483.912, "r_x1": 143.76, "r_y1": 483.912, "r_x2": 143.76, "r_y2": 475.36, "r_x3": 50.112, "r_y3": 475.36, "coord_origin": "TOPLEFT"}, "text": "for a rectangular table,", "orig": "for a rectangular table,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 147.696, "r_y0": 483.912, "r_x1": 153.235, "r_y1": 483.912, "r_x2": 153.235, "r_y2": 475.36, "r_x3": 147.696, "r_y3": 475.36, "coord_origin": "TOPLEFT"}, "text": "it", "orig": "it", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 156.881, "r_y0": 483.912, "r_x1": 163.526, "r_y1": 483.912, "r_x2": 163.526, "r_y2": 475.36, "r_x3": 156.881, "r_y3": 475.36, "coord_origin": "TOPLEFT"}, "text": "is", "orig": "is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 167.173, "r_y0": 483.912, "r_x1": 286.365, "r_y1": 483.912, "r_x2": 286.365, "r_y2": 475.36, "r_x3": 167.173, "r_y3": 475.36, "coord_origin": "TOPLEFT"}, "text": "possible to compute the geo-", "orig": "possible to compute the geo-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 495.867, "r_x1": 286.365, "r_y1": 495.867, "r_x2": 286.365, "r_y2": 487.315, "r_x3": 50.112, "r_y3": 487.315, "coord_origin": "TOPLEFT"}, "text": "metrical border lines between the grid rows and columns.", "orig": "metrical border lines between the grid rows and columns.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 507.823, "r_x1": 286.365, "r_y1": 507.823, "r_x2": 286.365, "r_y2": 499.271, "r_x3": 50.112, "r_y3": 499.271, "coord_origin": "TOPLEFT"}, "text": "Eventually this information is used to generate the missing", "orig": "Eventually this information is used to generate the missing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 519.778, "r_x1": 286.365, "r_y1": 519.778, "r_x2": 286.365, "r_y2": 511.226, "r_x3": 50.112, "r_y3": 511.226, "coord_origin": "TOPLEFT"}, "text": "bounding boxes. Additionally, the existence of unused grid", "orig": "bounding boxes. Additionally, the existence of unused grid", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 531.733, "r_x1": 286.365, "r_y1": 531.733, "r_x2": 286.365, "r_y2": 523.181, "r_x3": 50.112, "r_y3": 523.181, "coord_origin": "TOPLEFT"}, "text": "squares indicates that the table rows have unequal number", "orig": "squares indicates that the table rows have unequal number", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 543.688, "r_x1": 286.365, "r_y1": 543.688, "r_x2": 286.365, "r_y2": 535.136, "r_x3": 50.112, "r_y3": 535.136, "coord_origin": "TOPLEFT"}, "text": "of columns and the overall structure is non-strict. The gen-", "orig": "of columns and the overall structure is non-strict. The gen-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 555.643, "r_x1": 286.365, "r_y1": 555.643, "r_x2": 286.365, "r_y2": 547.091, "r_x3": 50.112, "r_y3": 547.091, "coord_origin": "TOPLEFT"}, "text": "eration of missing bounding boxes for non-strict HTML ta-", "orig": "eration of missing bounding boxes for non-strict HTML ta-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 567.5989999999999, "r_x1": 257.474, "r_y1": 567.5989999999999, "r_x2": 257.474, "r_y2": 559.047, "r_x3": 50.112, "r_y3": 559.047, "coord_origin": "TOPLEFT"}, "text": "bles is ambiguous and therefore quite challenging.", "orig": "bles is ambiguous and therefore quite challenging.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 263.949, "r_y0": 567.5989999999999, "r_x1": 286.365, "r_y1": 567.5989999999999, "r_x2": 286.365, "r_y2": 559.047, "r_x3": 263.949, "r_y3": 559.047, "coord_origin": "TOPLEFT"}, "text": "Thus,", "orig": "Thus,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 48, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 579.554, "r_x1": 242.251, "r_y1": 579.554, "r_x2": 242.251, "r_y2": 571.002, "r_x3": 50.112, "r_y3": 571.002, "coord_origin": "TOPLEFT"}, "text": "we have decided to simply discard those tables.", "orig": "we have decided to simply discard those tables.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 49, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 246.714, "r_y0": 579.554, "r_x1": 286.365, "r_y1": 579.554, "r_x2": 286.365, "r_y2": 571.002, "r_x3": 246.714, "r_y3": 571.002, "coord_origin": "TOPLEFT"}, "text": "In case of", "orig": "In case of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 50, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 591.509, "r_x1": 286.365, "r_y1": 591.509, "r_x2": 286.365, "r_y2": 582.957, "r_x3": 50.112, "r_y3": 582.957, "coord_origin": "TOPLEFT"}, "text": "PubTabNet we have computed missing bounding boxes for", "orig": "PubTabNet we have computed missing bounding boxes for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 51, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 603.4639999999999, "r_x1": 286.365, "r_y1": 603.4639999999999, "r_x2": 286.365, "r_y2": 594.912, "r_x3": 50.112, "r_y3": 594.912, "coord_origin": "TOPLEFT"}, "text": "48% of the simple and 69% of the complex tables. Regard-", "orig": "48% of the simple and 69% of the complex tables. Regard-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 52, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 615.419, "r_x1": 286.365, "r_y1": 615.419, "r_x2": 286.365, "r_y2": 606.867, "r_x3": 50.112, "r_y3": 606.867, "coord_origin": "TOPLEFT"}, "text": "ing FinTabNet, 68% of the simple and 98% of the complex", "orig": "ing FinTabNet, 68% of the simple and 98% of the complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 53, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 627.374, "r_x1": 242.261, "r_y1": 627.374, "r_x2": 242.261, "r_y2": 618.822, "r_x3": 50.112, "r_y3": 618.822, "coord_origin": "TOPLEFT"}, "text": "tables require the generation of bounding boxes.", "orig": "tables require the generation of bounding boxes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 54, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 639.531, "r_x1": 286.365, "r_y1": 639.531, "r_x2": 286.365, "r_y2": 630.979, "r_x3": 62.067, "r_y3": 630.979, "coord_origin": "TOPLEFT"}, "text": "Figure 7 illustrates the distribution of the tables across", "orig": "Figure 7 illustrates the distribution of the tables across", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 55, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 651.487, "r_x1": 179.905, "r_y1": 651.487, "r_x2": 179.905, "r_y2": 642.935, "r_x3": 50.112, "r_y3": 642.935, "coord_origin": "TOPLEFT"}, "text": "different dimensions per dataset.", "orig": "different dimensions per dataset.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 56, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 672.242, "r_x1": 153.608, "r_y1": 672.242, "r_x2": 153.608, "r_y2": 662.39, "r_x3": 50.112, "r_y3": 662.39, "coord_origin": "TOPLEFT"}, "text": "1.2. Synthetic datasets", "orig": "1.2. Synthetic datasets", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 57, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 690.152, "r_x1": 286.365, "r_y1": 690.152, "r_x2": 286.365, "r_y2": 681.6, "r_x3": 62.067, "r_y3": 681.6, "coord_origin": "TOPLEFT"}, "text": "Aiming to train and evaluate our models in a broader", "orig": "Aiming to train and evaluate our models in a broader", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 58, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 702.107, "r_x1": 286.365, "r_y1": 702.107, "r_x2": 286.365, "r_y2": 693.5550000000001, "r_x3": 50.112, "r_y3": 693.5550000000001, "coord_origin": "TOPLEFT"}, "text": "spectrum of table data we have synthesized four types of", "orig": "spectrum of table data we have synthesized four types of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 59, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 714.062, "r_x1": 84.144, "r_y1": 714.062, "r_x2": 84.144, "r_y2": 705.51, "r_x3": 50.112, "r_y3": 705.51, "coord_origin": "TOPLEFT"}, "text": "datasets.", "orig": "datasets.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 60, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 91.238, "r_y0": 714.062, "r_x1": 286.365, "r_y1": 714.062, "r_x2": 286.365, "r_y2": 705.51, "r_x3": 91.238, "r_y3": 705.51, "coord_origin": "TOPLEFT"}, "text": "Each one contains tables with different appear-", "orig": "Each one contains tables with different appear-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 61, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 171.476, "r_x1": 426.929, "r_y1": 171.476, "r_x2": 426.929, "r_y2": 162.92399999999998, "r_x3": 308.862, "r_y3": 162.92399999999998, "coord_origin": "TOPLEFT"}, "text": "ances in regard to their size,", "orig": "ances in regard to their size,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 62, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 431.043, "r_y0": 171.476, "r_x1": 468.393, "r_y1": 171.476, "r_x2": 468.393, "r_y2": 162.92399999999998, "r_x3": 431.043, "r_y3": 162.92399999999998, "coord_origin": "TOPLEFT"}, "text": "structure,", "orig": "structure,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 63, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 472.508, "r_y0": 171.476, "r_x1": 491.327, "r_y1": 171.476, "r_x2": 491.327, "r_y2": 162.92399999999998, "r_x3": 472.508, "r_y3": 162.92399999999998, "coord_origin": "TOPLEFT"}, "text": "style", "orig": "style", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 64, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 495.113, "r_y0": 171.476, "r_x1": 545.115, "r_y1": 171.476, "r_x2": 545.115, "r_y2": 162.92399999999998, "r_x3": 495.113, "r_y3": 162.92399999999998, "coord_origin": "TOPLEFT"}, "text": "and content.", "orig": "and content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 65, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 183.43100000000004, "r_x1": 545.115, "r_y1": 183.43100000000004, "r_x2": 545.115, "r_y2": 174.87900000000002, "r_x3": 308.862, "r_y3": 174.87900000000002, "coord_origin": "TOPLEFT"}, "text": "Every synthetic dataset contains 150k examples, summing", "orig": "Every synthetic dataset contains 150k examples, summing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 66, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 195.38599999999997, "r_x1": 545.115, "r_y1": 195.38599999999997, "r_x2": 545.115, "r_y2": 186.83399999999995, "r_x3": 308.862, "r_y3": 186.83399999999995, "coord_origin": "TOPLEFT"}, "text": "up to 600k synthetic examples. All datasets are divided into", "orig": "up to 600k synthetic examples. All datasets are divided into", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 67, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 207.34199999999998, "r_x1": 484.074, "r_y1": 207.34199999999998, "r_x2": 484.074, "r_y2": 198.78999999999996, "r_x3": 308.862, "r_y3": 198.78999999999996, "coord_origin": "TOPLEFT"}, "text": "Train, Test and Val splits (80%, 10%, 10%).", "orig": "Train, Test and Val splits (80%, 10%, 10%).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 68, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 220.05600000000004, "r_x1": 545.115, "r_y1": 220.05600000000004, "r_x2": 545.115, "r_y2": 211.50400000000002, "r_x3": 320.817, "r_y3": 211.50400000000002, "coord_origin": "TOPLEFT"}, "text": "The process of generating a synthetic dataset can be de-", "orig": "The process of generating a synthetic dataset can be de-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 69, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 232.01099999999997, "r_x1": 448.089, "r_y1": 232.01099999999997, "r_x2": 448.089, "r_y2": 223.45899999999995, "r_x3": 308.862, "r_y3": 223.45899999999995, "coord_origin": "TOPLEFT"}, "text": "composed into the following steps:", "orig": "composed into the following steps:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 70, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 244.726, "r_x1": 328.289, "r_y1": 244.726, "r_x2": 328.289, "r_y2": 236.17399999999998, "r_x3": 320.817, "r_y3": 236.17399999999998, "coord_origin": "TOPLEFT"}, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 71, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 335.382, "r_y0": 244.726, "r_x1": 492.911, "r_y1": 244.726, "r_x2": 492.911, "r_y2": 236.17399999999998, "r_x3": 335.382, "r_y3": 236.17399999999998, "coord_origin": "TOPLEFT"}, "text": "Prepare styling and content templates:", "orig": "Prepare styling and content templates:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 72, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 498.669, "r_y0": 244.726, "r_x1": 545.115, "r_y1": 244.726, "r_x2": 545.115, "r_y2": 236.17399999999998, "r_x3": 498.669, "r_y3": 236.17399999999998, "coord_origin": "TOPLEFT"}, "text": "The styling", "orig": "The styling", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 73, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 256.68100000000004, "r_x1": 545.115, "r_y1": 256.68100000000004, "r_x2": 545.115, "r_y2": 248.12900000000002, "r_x3": 308.862, "r_y3": 248.12900000000002, "coord_origin": "TOPLEFT"}, "text": "templates have been manually designed and organized into", "orig": "templates have been manually designed and organized into", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 74, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 268.63599999999997, "r_x1": 481.733, "r_y1": 268.63599999999997, "r_x2": 481.733, "r_y2": 260.08399999999995, "r_x3": 308.862, "r_y3": 260.08399999999995, "coord_origin": "TOPLEFT"}, "text": "groups of scope specific appearances (e.g.", "orig": "groups of scope specific appearances (e.g.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 75, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 488.119, "r_y0": 268.63599999999997, "r_x1": 545.115, "r_y1": 268.63599999999997, "r_x2": 545.115, "r_y2": 260.08399999999995, "r_x3": 488.119, "r_y3": 260.08399999999995, "coord_origin": "TOPLEFT"}, "text": "financial data,", "orig": "financial data,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 76, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 280.591, "r_x1": 393.385, "r_y1": 280.591, "r_x2": 393.385, "r_y2": 272.039, "r_x3": 308.862, "r_y3": 272.039, "coord_origin": "TOPLEFT"}, "text": "marketing data, etc.)", "orig": "marketing data, etc.)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 77, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 400.119, "r_y0": 280.591, "r_x1": 545.115, "r_y1": 280.591, "r_x2": 545.115, "r_y2": 272.039, "r_x3": 400.119, "r_y3": 272.039, "coord_origin": "TOPLEFT"}, "text": "Additionally, we have prepared cu-", "orig": "Additionally, we have prepared cu-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 78, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 292.546, "r_x1": 545.115, "r_y1": 292.546, "r_x2": 545.115, "r_y2": 283.994, "r_x3": 308.862, "r_y3": 283.994, "coord_origin": "TOPLEFT"}, "text": "rated collections of content templates by extracting the most", "orig": "rated collections of content templates by extracting the most", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 79, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 304.502, "r_x1": 349.808, "r_y1": 304.502, "r_x2": 349.808, "r_y2": 295.95, "r_x3": 308.862, "r_y3": 295.95, "coord_origin": "TOPLEFT"}, "text": "frequently", "orig": "frequently", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 80, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 354.152, "r_y0": 304.502, "r_x1": 487.183, "r_y1": 304.502, "r_x2": 487.183, "r_y2": 295.95, "r_x3": 354.152, "r_y3": 295.95, "coord_origin": "TOPLEFT"}, "text": "used terms out of non-synthetic", "orig": "used terms out of non-synthetic", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 81, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 491.526, "r_y0": 304.502, "r_x1": 523.068, "r_y1": 304.502, "r_x2": 523.068, "r_y2": 295.95, "r_x3": 491.526, "r_y3": 295.95, "coord_origin": "TOPLEFT"}, "text": "datasets", "orig": "datasets", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 82, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 527.412, "r_y0": 304.502, "r_x1": 545.115, "r_y1": 304.502, "r_x2": 545.115, "r_y2": 295.95, "r_x3": 527.412, "r_y3": 295.95, "coord_origin": "TOPLEFT"}, "text": "(e.g.", "orig": "(e.g.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 83, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 316.457, "r_x1": 425.693, "r_y1": 316.457, "r_x2": 425.693, "r_y2": 307.905, "r_x3": 308.862, "r_y3": 307.905, "coord_origin": "TOPLEFT"}, "text": "PubTabNet, FinTabNet, etc.).", "orig": "PubTabNet, FinTabNet, etc.).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 84, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 329.171, "r_x1": 328.289, "r_y1": 329.171, "r_x2": 328.289, "r_y2": 320.619, "r_x3": 320.817, "r_y3": 320.619, "coord_origin": "TOPLEFT"}, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 85, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 332.692, "r_y0": 329.171, "r_x1": 435.377, "r_y1": 329.171, "r_x2": 435.377, "r_y2": 320.619, "r_x3": 332.692, "r_y3": 320.619, "coord_origin": "TOPLEFT"}, "text": "Generate table structures:", "orig": "Generate table structures:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 86, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 439.342, "r_y0": 329.171, "r_x1": 545.115, "r_y1": 329.171, "r_x2": 545.115, "r_y2": 320.619, "r_x3": 439.342, "r_y3": 320.619, "coord_origin": "TOPLEFT"}, "text": "The structure of each syn-", "orig": "The structure of each syn-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 87, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 341.126, "r_x1": 545.115, "r_y1": 341.126, "r_x2": 545.115, "r_y2": 332.574, "r_x3": 308.862, "r_y3": 332.574, "coord_origin": "TOPLEFT"}, "text": "thetic dataset assumes a horizontal table header which po-", "orig": "thetic dataset assumes a horizontal table header which po-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 88, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 353.081, "r_x1": 341.519, "r_y1": 353.081, "r_x2": 341.519, "r_y2": 344.529, "r_x3": 308.862, "r_y3": 344.529, "coord_origin": "TOPLEFT"}, "text": "tentially", "orig": "tentially", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 89, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 345.813, "r_y0": 353.081, "r_x1": 427.168, "r_y1": 353.081, "r_x2": 427.168, "r_y2": 344.529, "r_x3": 345.813, "r_y3": 344.529, "coord_origin": "TOPLEFT"}, "text": "spans over multiple", "orig": "spans over multiple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 90, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 431.462, "r_y0": 353.081, "r_x1": 545.115, "r_y1": 353.081, "r_x2": 545.115, "r_y2": 344.529, "r_x3": 431.462, "r_y3": 344.529, "coord_origin": "TOPLEFT"}, "text": "rows and a table body that", "orig": "rows and a table body that", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 91, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 365.037, "r_x1": 545.115, "r_y1": 365.037, "r_x2": 545.115, "r_y2": 356.485, "r_x3": 308.862, "r_y3": 356.485, "coord_origin": "TOPLEFT"}, "text": "may contain a combination of row spans and column spans.", "orig": "may contain a combination of row spans and column spans.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 92, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 376.992, "r_x1": 545.115, "r_y1": 376.992, "r_x2": 545.115, "r_y2": 368.44, "r_x3": 308.862, "r_y3": 368.44, "coord_origin": "TOPLEFT"}, "text": "However, spans are not allowed to cross the header - body", "orig": "However, spans are not allowed to cross the header - body", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 93, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 388.947, "r_x1": 348.334, "r_y1": 388.947, "r_x2": 348.334, "r_y2": 380.395, "r_x3": 308.862, "r_y3": 380.395, "coord_origin": "TOPLEFT"}, "text": "boundary.", "orig": "boundary.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 94, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 353.504, "r_y0": 388.947, "r_x1": 545.115, "r_y1": 388.947, "r_x2": 545.115, "r_y2": 380.395, "r_x3": 353.504, "r_y3": 380.395, "coord_origin": "TOPLEFT"}, "text": "The table structure is described by the parame-", "orig": "The table structure is described by the parame-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 95, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 400.902, "r_x1": 326.018, "r_y1": 400.902, "r_x2": 326.018, "r_y2": 392.35, "r_x3": 308.862, "r_y3": 392.35, "coord_origin": "TOPLEFT"}, "text": "ters:", "orig": "ters:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 96, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 330.909, "r_y0": 400.902, "r_x1": 545.115, "r_y1": 400.902, "r_x2": 545.115, "r_y2": 392.35, "r_x3": 330.909, "r_y3": 392.35, "coord_origin": "TOPLEFT"}, "text": "Total number of table rows and columns, number of", "orig": "Total number of table rows and columns, number of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 97, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 412.857, "r_x1": 545.115, "r_y1": 412.857, "r_x2": 545.115, "r_y2": 404.305, "r_x3": 308.862, "r_y3": 404.305, "coord_origin": "TOPLEFT"}, "text": "header rows, type of spans (header only spans, row only", "orig": "header rows, type of spans (header only spans, row only", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 98, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 424.812, "r_x1": 333.49, "r_y1": 424.812, "r_x2": 333.49, "r_y2": 416.26, "r_x3": 308.862, "r_y3": 416.26, "coord_origin": "TOPLEFT"}, "text": "spans,", "orig": "spans,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 99, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 338.082, "r_y0": 424.812, "r_x1": 418.66, "r_y1": 424.812, "r_x2": 418.66, "r_y2": 416.26, "r_x3": 338.082, "r_y3": 416.26, "coord_origin": "TOPLEFT"}, "text": "column only spans,", "orig": "column only spans,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 100, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 423.253, "r_y0": 424.812, "r_x1": 545.115, "r_y1": 424.812, "r_x2": 545.115, "r_y2": 416.26, "r_x3": 423.253, "r_y3": 416.26, "coord_origin": "TOPLEFT"}, "text": "both row and column spans),", "orig": "both row and column spans),", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 101, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 436.768, "r_x1": 545.115, "r_y1": 436.768, "r_x2": 545.115, "r_y2": 428.216, "r_x3": 308.862, "r_y3": 428.216, "coord_origin": "TOPLEFT"}, "text": "maximum span size and the ratio of the table area covered", "orig": "maximum span size and the ratio of the table area covered", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 102, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 448.723, "r_x1": 345.943, "r_y1": 448.723, "r_x2": 345.943, "r_y2": 440.171, "r_x3": 308.862, "r_y3": 440.171, "coord_origin": "TOPLEFT"}, "text": "by spans.", "orig": "by spans.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 103, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 461.437, "r_x1": 485.758, "r_y1": 461.437, "r_x2": 485.758, "r_y2": 452.885, "r_x3": 320.817, "r_y3": 452.885, "coord_origin": "TOPLEFT"}, "text": "3. Generate content: Based on the dataset", "orig": "3. Generate content: Based on the dataset", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 104, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 488.073, "r_y0": 461.294, "r_x1": 511.864, "r_y1": 461.294, "r_x2": 511.864, "r_y2": 452.706, "r_x3": 488.073, "r_y3": 452.706, "coord_origin": "TOPLEFT"}, "text": "theme", "orig": "theme", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 105, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 511.863, "r_y0": 461.437, "r_x1": 545.108, "r_y1": 461.437, "r_x2": 545.108, "r_y2": 452.885, "r_x3": 511.863, "r_y3": 452.885, "coord_origin": "TOPLEFT"}, "text": ", a set of", "orig": ", a set of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 106, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 473.392, "r_x1": 545.115, "r_y1": 473.392, "r_x2": 545.115, "r_y2": 464.84, "r_x3": 308.862, "r_y3": 464.84, "coord_origin": "TOPLEFT"}, "text": "suitable content templates is chosen first. Then, this content", "orig": "suitable content templates is chosen first. Then, this content", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 107, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 485.348, "r_x1": 545.115, "r_y1": 485.348, "r_x2": 545.115, "r_y2": 476.796, "r_x3": 308.862, "r_y3": 476.796, "coord_origin": "TOPLEFT"}, "text": "can be combined with purely random text to produce the", "orig": "can be combined with purely random text to produce the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 108, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 497.303, "r_x1": 379.148, "r_y1": 497.303, "r_x2": 379.148, "r_y2": 488.751, "r_x3": 308.862, "r_y3": 488.751, "coord_origin": "TOPLEFT"}, "text": "synthetic content.", "orig": "synthetic content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 109, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 510.017, "r_x1": 328.289, "r_y1": 510.017, "r_x2": 328.289, "r_y2": 501.465, "r_x3": 320.817, "r_y3": 501.465, "coord_origin": "TOPLEFT"}, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 110, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 334.217, "r_y0": 510.017, "r_x1": 434.082, "r_y1": 510.017, "r_x2": 434.082, "r_y2": 501.465, "r_x3": 334.217, "r_y3": 501.465, "coord_origin": "TOPLEFT"}, "text": "Apply styling templates:", "orig": "Apply styling templates:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 111, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 439.063, "r_y0": 510.017, "r_x1": 545.115, "r_y1": 510.017, "r_x2": 545.115, "r_y2": 501.465, "r_x3": 439.063, "r_y3": 501.465, "coord_origin": "TOPLEFT"}, "text": "Depending on the domain", "orig": "Depending on the domain", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 112, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 521.972, "r_x1": 406.884, "r_y1": 521.972, "r_x2": 406.884, "r_y2": 513.4200000000001, "r_x3": 308.862, "r_y3": 513.4200000000001, "coord_origin": "TOPLEFT"}, "text": "of the synthetic dataset,", "orig": "of the synthetic dataset,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 113, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 411.019, "r_y0": 521.972, "r_x1": 545.115, "r_y1": 521.972, "r_x2": 545.115, "r_y2": 513.4200000000001, "r_x3": 411.019, "r_y3": 513.4200000000001, "coord_origin": "TOPLEFT"}, "text": "a set of styling templates is first", "orig": "a set of styling templates is first", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 114, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 533.928, "r_x1": 384.299, "r_y1": 533.928, "r_x2": 384.299, "r_y2": 525.376, "r_x3": 308.862, "r_y3": 525.376, "coord_origin": "TOPLEFT"}, "text": "manually selected.", "orig": "manually selected.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 115, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 391.253, "r_y0": 533.928, "r_x1": 545.115, "r_y1": 533.928, "r_x2": 545.115, "r_y2": 525.376, "r_x3": 391.253, "r_y3": 525.376, "coord_origin": "TOPLEFT"}, "text": "Then, a style is randomly selected to", "orig": "Then, a style is randomly selected to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 116, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 545.883, "r_x1": 496.159, "r_y1": 545.883, "r_x2": 496.159, "r_y2": 537.331, "r_x3": 308.862, "r_y3": 537.331, "coord_origin": "TOPLEFT"}, "text": "format the appearance of the synthesized table.", "orig": "format the appearance of the synthesized table.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 117, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 558.597, "r_x1": 328.289, "r_y1": 558.597, "r_x2": 328.289, "r_y2": 550.045, "r_x3": 320.817, "r_y3": 550.045, "coord_origin": "TOPLEFT"}, "text": "5.", "orig": "5.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 118, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 335.402, "r_y0": 558.597, "r_x1": 450.371, "r_y1": 558.597, "r_x2": 450.371, "r_y2": 550.045, "r_x3": 335.402, "r_y3": 550.045, "coord_origin": "TOPLEFT"}, "text": "Render the complete tables:", "orig": "Render the complete tables:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 119, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 456.139, "r_y0": 558.597, "r_x1": 545.115, "r_y1": 558.597, "r_x2": 545.115, "r_y2": 550.045, "r_x3": 456.139, "r_y3": 550.045, "coord_origin": "TOPLEFT"}, "text": "The synthetic table is", "orig": "The synthetic table is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 120, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 570.552, "r_x1": 334.326, "r_y1": 570.552, "r_x2": 334.326, "r_y2": 562.0, "r_x3": 308.862, "r_y3": 562.0, "coord_origin": "TOPLEFT"}, "text": "finally", "orig": "finally", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 121, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 337.983, "r_y0": 570.552, "r_x1": 545.115, "r_y1": 570.552, "r_x2": 545.115, "r_y2": 562.0, "r_x3": 337.983, "r_y3": 562.0, "coord_origin": "TOPLEFT"}, "text": "rendered by a web browser engine to generate the", "orig": "rendered by a web browser engine to generate the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 122, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 582.5070000000001, "r_x1": 545.115, "r_y1": 582.5070000000001, "r_x2": 545.115, "r_y2": 573.955, "r_x3": 308.862, "r_y3": 573.955, "coord_origin": "TOPLEFT"}, "text": "bounding boxes for each table cell. A batching technique is", "orig": "bounding boxes for each table cell. A batching technique is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 123, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 594.463, "r_x1": 545.115, "r_y1": 594.463, "r_x2": 545.115, "r_y2": 585.9110000000001, "r_x3": 308.862, "r_y3": 585.9110000000001, "coord_origin": "TOPLEFT"}, "text": "utilized to optimize the runtime overhead of the rendering", "orig": "utilized to optimize the runtime overhead of the rendering", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 124, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 606.418, "r_x1": 341.23, "r_y1": 606.418, "r_x2": 341.23, "r_y2": 597.866, "r_x3": 308.862, "r_y3": 597.866, "coord_origin": "TOPLEFT"}, "text": "process.", "orig": "process.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 125, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 633.039, "r_x1": 317.828, "r_y1": 633.039, "r_x2": 317.828, "r_y2": 622.2909999999999, "r_x3": 308.862, "r_y3": 622.2909999999999, "coord_origin": "TOPLEFT"}, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 126, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 323.591, "r_y0": 633.039, "r_x1": 376.493, "r_y1": 633.039, "r_x2": 376.493, "r_y2": 622.2909999999999, "r_x3": 323.591, "r_y3": 622.2909999999999, "coord_origin": "TOPLEFT"}, "text": "Prediction", "orig": "Prediction", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 127, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 382.255, "r_y0": 633.039, "r_x1": 461.076, "r_y1": 633.039, "r_x2": 461.076, "r_y2": 622.2909999999999, "r_x3": 382.255, "r_y3": 622.2909999999999, "coord_origin": "TOPLEFT"}, "text": "post-processing", "orig": "post-processing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 128, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 466.826, "r_y0": 633.039, "r_x1": 481.794, "r_y1": 633.039, "r_x2": 481.794, "r_y2": 622.2909999999999, "r_x3": 466.826, "r_y3": 622.2909999999999, "coord_origin": "TOPLEFT"}, "text": "for", "orig": "for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 129, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 487.556, "r_y0": 633.039, "r_x1": 545.109, "r_y1": 633.039, "r_x2": 545.109, "r_y2": 622.2909999999999, "r_x3": 487.556, "r_y3": 622.2909999999999, "coord_origin": "TOPLEFT"}, "text": "PDF docu-", "orig": "PDF docu-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 130, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 326.795, "r_y0": 646.987, "r_x1": 357.341, "r_y1": 646.987, "r_x2": 357.341, "r_y2": 636.239, "r_x3": 326.795, "r_y3": 636.239, "coord_origin": "TOPLEFT"}, "text": "ments", "orig": "ments", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 131, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 666.242, "r_x1": 545.115, "r_y1": 666.242, "r_x2": 545.115, "r_y2": 657.69, "r_x3": 320.817, "r_y3": 657.69, "coord_origin": "TOPLEFT"}, "text": "Although TableFormer can predict the table structure and", "orig": "Although TableFormer can predict the table structure and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 132, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 678.197, "r_x1": 545.115, "r_y1": 678.197, "r_x2": 545.115, "r_y2": 669.645, "r_x3": 308.862, "r_y3": 669.645, "coord_origin": "TOPLEFT"}, "text": "the bounding boxes for tables recognized inside PDF docu-", "orig": "the bounding boxes for tables recognized inside PDF docu-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 133, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 690.152, "r_x1": 545.115, "r_y1": 690.152, "r_x2": 545.115, "r_y2": 681.6, "r_x3": 308.862, "r_y3": 681.6, "coord_origin": "TOPLEFT"}, "text": "ments, this is not enough when a full reconstruction of the", "orig": "ments, this is not enough when a full reconstruction of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 134, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 702.107, "r_x1": 545.115, "r_y1": 702.107, "r_x2": 545.115, "r_y2": 693.5550000000001, "r_x3": 308.862, "r_y3": 693.5550000000001, "coord_origin": "TOPLEFT"}, "text": "original table is required. This happens mainly due the fol-", "orig": "original table is required. This happens mainly due the fol-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 135, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 714.063, "r_x1": 371.427, "r_y1": 714.063, "r_x2": 371.427, "r_y2": 705.511, "r_x3": 308.862, "r_y3": 705.511, "coord_origin": "TOPLEFT"}, "text": "lowing reasons:", "orig": "lowing reasons:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 136, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 292.631, "r_y0": 742.954, "r_x1": 302.594, "r_y1": 742.954, "r_x2": 302.594, "r_y2": 734.402, "r_x3": 292.631, "r_y3": 734.402, "coord_origin": "TOPLEFT"}, "text": "11", "orig": "11", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "parsed_page": null, "predictions": {"layout": {"clusters": [{"id": 18, "label": "section_header", "bbox": {"l": 132.842, "t": 110.57500000000005, "r": 465.376, "b": 135.48400000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.6497084498405457, "cells": [{"index": 0, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 132.842, "r_y0": 121.32299999999998, "r_x1": 465.376, "r_y1": 121.32299999999998, "r_x2": 465.376, "r_y2": 110.57500000000005, "r_x3": 132.842, "r_y3": 110.57500000000005, "coord_origin": "TOPLEFT"}, "text": "TableFormer: Table Structure Understanding with Transformers", "orig": "TableFormer: Table Structure Understanding with Transformers", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 220.184, "r_y0": 135.48400000000004, "r_x1": 375.043, "r_y1": 135.48400000000004, "r_x2": 375.043, "r_y2": 122.42399999999998, "r_x3": 220.184, "r_y3": 122.42399999999998, "coord_origin": "TOPLEFT"}, "text": "Supplementary Material", "orig": "Supplementary Material", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 13, "label": "section_header", "bbox": {"l": 50.112, "t": 161.16099999999994, "r": 175.964, "b": 171.909, "coord_origin": "TOPLEFT"}, "confidence": 0.9454860091209412, "cells": [{"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 171.909, "r_x1": 175.964, "r_y1": 171.909, "r_x2": 175.964, "r_y2": 161.16099999999994, "r_x3": 50.112, "r_y3": 161.16099999999994, "coord_origin": "TOPLEFT"}, "text": "1. Details on the datasets", "orig": "1. Details on the datasets", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 11, "label": "section_header", "bbox": {"l": 50.112, "t": 180.97900000000004, "r": 150.364, "b": 190.83100000000002, "coord_origin": "TOPLEFT"}, "confidence": 0.9535645842552185, "cells": [{"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 190.83100000000002, "r_x1": 150.364, "r_y1": 190.83100000000002, "r_x2": 150.364, "r_y2": 180.97900000000004, "r_x3": 50.112, "r_y3": 180.97900000000004, "coord_origin": "TOPLEFT"}, "text": "1.1. Data preparation", "orig": "1.1. Data preparation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 0, "label": "text", "bbox": {"l": 50.112, "t": 200.18899999999996, "r": 286.365, "b": 388.069, "coord_origin": "TOPLEFT"}, "confidence": 0.9864971041679382, "cells": [{"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 208.74099999999999, "r_x1": 286.365, "r_y1": 208.74099999999999, "r_x2": 286.365, "r_y2": 200.18899999999996, "r_x3": 62.067, "r_y3": 200.18899999999996, "coord_origin": "TOPLEFT"}, "text": "As a first step of our data preparation process, we have", "orig": "As a first step of our data preparation process, we have", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 220.697, "r_x1": 286.365, "r_y1": 220.697, "r_x2": 286.365, "r_y2": 212.14499999999998, "r_x3": 50.112, "r_y3": 212.14499999999998, "coord_origin": "TOPLEFT"}, "text": "calculated statistics over the datasets across the following", "orig": "calculated statistics over the datasets across the following", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 232.65200000000004, "r_x1": 286.365, "r_y1": 232.65200000000004, "r_x2": 286.365, "r_y2": 224.10000000000002, "r_x3": 50.112, "r_y3": 224.10000000000002, "coord_origin": "TOPLEFT"}, "text": "dimensions: (1) table size measured in the number of rows", "orig": "dimensions: (1) table size measured in the number of rows", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 244.60699999999997, "r_x1": 286.365, "r_y1": 244.60699999999997, "r_x2": 286.365, "r_y2": 236.05499999999995, "r_x3": 50.112, "r_y3": 236.05499999999995, "coord_origin": "TOPLEFT"}, "text": "and columns, (2) complexity of the table, (3) strictness of", "orig": "and columns, (2) complexity of the table, (3) strictness of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 256.562, "r_x1": 286.365, "r_y1": 256.562, "r_x2": 286.365, "r_y2": 248.01, "r_x3": 50.112, "r_y3": 248.01, "coord_origin": "TOPLEFT"}, "text": "the provided HTML structure and (4) completeness (i.e. no", "orig": "the provided HTML structure and (4) completeness (i.e. no", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 268.51700000000005, "r_x1": 286.365, "r_y1": 268.51700000000005, "r_x2": 286.365, "r_y2": 259.96500000000003, "r_x3": 50.112, "r_y3": 259.96500000000003, "coord_origin": "TOPLEFT"}, "text": "omitted bounding boxes). Atable is considered to be simple", "orig": "omitted bounding boxes). Atable is considered to be simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 280.472, "r_x1": 286.365, "r_y1": 280.472, "r_x2": 286.365, "r_y2": 271.91999999999996, "r_x3": 50.112, "r_y3": 271.91999999999996, "coord_origin": "TOPLEFT"}, "text": "if it does not contain row spans or column spans. Addition-", "orig": "if it does not contain row spans or column spans. Addition-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 292.428, "r_x1": 286.365, "r_y1": 292.428, "r_x2": 286.365, "r_y2": 283.876, "r_x3": 50.112, "r_y3": 283.876, "coord_origin": "TOPLEFT"}, "text": "ally, a table has a strict HTMLstructure if every row has the", "orig": "ally, a table has a strict HTMLstructure if every row has the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 304.383, "r_x1": 286.365, "r_y1": 304.383, "r_x2": 286.365, "r_y2": 295.831, "r_x3": 50.112, "r_y3": 295.831, "coord_origin": "TOPLEFT"}, "text": "same number of columns after taking into account any row", "orig": "same number of columns after taking into account any row", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 316.338, "r_x1": 118.834, "r_y1": 316.338, "r_x2": 118.834, "r_y2": 307.786, "r_x3": 50.112, "r_y3": 307.786, "coord_origin": "TOPLEFT"}, "text": "or column spans.", "orig": "or column spans.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 123.307, "r_y0": 316.338, "r_x1": 286.365, "r_y1": 316.338, "r_x2": 286.365, "r_y2": 307.786, "r_x3": 123.307, "r_y3": 307.786, "coord_origin": "TOPLEFT"}, "text": "Therefore a strict HTML structure looks", "orig": "Therefore a strict HTML structure looks", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 328.293, "r_x1": 127.163, "r_y1": 328.293, "r_x2": 127.163, "r_y2": 319.741, "r_x3": 50.112, "r_y3": 319.741, "coord_origin": "TOPLEFT"}, "text": "always rectangular.", "orig": "always rectangular.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 131.257, "r_y0": 328.293, "r_x1": 286.365, "r_y1": 328.293, "r_x2": 286.365, "r_y2": 319.741, "r_x3": 131.257, "r_y3": 319.741, "coord_origin": "TOPLEFT"}, "text": "However, HTML is a lenient encoding", "orig": "However, HTML is a lenient encoding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 340.248, "r_x1": 95.163, "r_y1": 340.248, "r_x2": 95.163, "r_y2": 331.696, "r_x3": 50.112, "r_y3": 331.696, "coord_origin": "TOPLEFT"}, "text": "format, i.e.", "orig": "format, i.e.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 101.459, "r_y0": 340.248, "r_x1": 286.365, "r_y1": 340.248, "r_x2": 286.365, "r_y2": 331.696, "r_x3": 101.459, "r_y3": 331.696, "coord_origin": "TOPLEFT"}, "text": "tables with rows of different sizes might still", "orig": "tables with rows of different sizes might still", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 19, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 352.204, "r_x1": 257.942, "r_y1": 352.204, "r_x2": 257.942, "r_y2": 343.652, "r_x3": 50.112, "r_y3": 343.652, "coord_origin": "TOPLEFT"}, "text": "be regarded as correct due to implicit display rules.", "orig": "be regarded as correct due to implicit display rules.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 20, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 262.574, "r_y0": 352.204, "r_x1": 286.365, "r_y1": 352.204, "r_x2": 286.365, "r_y2": 343.652, "r_x3": 262.574, "r_y3": 343.652, "coord_origin": "TOPLEFT"}, "text": "These", "orig": "These", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 21, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 364.159, "r_x1": 286.365, "r_y1": 364.159, "r_x2": 286.365, "r_y2": 355.607, "r_x3": 50.112, "r_y3": 355.607, "coord_origin": "TOPLEFT"}, "text": "implicit rules leave room for ambiguity, which we want to", "orig": "implicit rules leave room for ambiguity, which we want to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 22, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 376.114, "r_x1": 286.365, "r_y1": 376.114, "r_x2": 286.365, "r_y2": 367.562, "r_x3": 50.112, "r_y3": 367.562, "coord_origin": "TOPLEFT"}, "text": "avoid. As such, we prefer to have 'strict' tables, i.e. tables", "orig": "avoid. As such, we prefer to have 'strict' tables, i.e. tables", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 23, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 388.069, "r_x1": 230.804, "r_y1": 388.069, "r_x2": 230.804, "r_y2": 379.517, "r_x3": 50.112, "r_y3": 379.517, "coord_origin": "TOPLEFT"}, "text": "where every row has exactly the same length.", "orig": "where every row has exactly the same length.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 2, "label": "text", "bbox": {"l": 50.112, "t": 391.674, "r": 286.365, "b": 627.374, "coord_origin": "TOPLEFT"}, "confidence": 0.9826022386550903, "cells": [{"index": 24, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 400.226, "r_x1": 236.243, "r_y1": 400.226, "r_x2": 236.243, "r_y2": 391.674, "r_x3": 62.067, "r_y3": 391.674, "coord_origin": "TOPLEFT"}, "text": "We have developed a technique that tries", "orig": "We have developed a technique that tries", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 25, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 240.726, "r_y0": 400.226, "r_x1": 248.477, "r_y1": 400.226, "r_x2": 248.477, "r_y2": 391.674, "r_x3": 240.726, "r_y3": 391.674, "coord_origin": "TOPLEFT"}, "text": "to", "orig": "to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 26, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 252.96, "r_y0": 400.226, "r_x1": 277.458, "r_y1": 400.226, "r_x2": 277.458, "r_y2": 391.674, "r_x3": 252.96, "r_y3": 391.674, "coord_origin": "TOPLEFT"}, "text": "derive", "orig": "derive", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 27, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 281.942, "r_y0": 400.226, "r_x1": 286.365, "r_y1": 400.226, "r_x2": 286.365, "r_y2": 391.674, "r_x3": 281.942, "r_y3": 391.674, "coord_origin": "TOPLEFT"}, "text": "a", "orig": "a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 28, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 412.181, "r_x1": 223.571, "r_y1": 412.181, "r_x2": 223.571, "r_y2": 403.629, "r_x3": 50.112, "r_y3": 403.629, "coord_origin": "TOPLEFT"}, "text": "missing bounding box out of its neighbors.", "orig": "missing bounding box out of its neighbors.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 29, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 228.004, "r_y0": 412.181, "r_x1": 286.365, "r_y1": 412.181, "r_x2": 286.365, "r_y2": 403.629, "r_x3": 228.004, "r_y3": 403.629, "coord_origin": "TOPLEFT"}, "text": "As a first step,", "orig": "As a first step,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 30, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 424.136, "r_x1": 286.365, "r_y1": 424.136, "r_x2": 286.365, "r_y2": 415.584, "r_x3": 50.112, "r_y3": 415.584, "coord_origin": "TOPLEFT"}, "text": "we use the annotation data to generate the most fine-grained", "orig": "we use the annotation data to generate the most fine-grained", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 436.092, "r_x1": 189.519, "r_y1": 436.092, "r_x2": 189.519, "r_y2": 427.54, "r_x3": 50.112, "r_y3": 427.54, "coord_origin": "TOPLEFT"}, "text": "grid that covers the table structure.", "orig": "grid that covers the table structure.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 193.414, "r_y0": 436.092, "r_x1": 286.365, "r_y1": 436.092, "r_x2": 286.365, "r_y2": 427.54, "r_x3": 193.414, "r_y3": 427.54, "coord_origin": "TOPLEFT"}, "text": "In case of strict HTML", "orig": "In case of strict HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 448.047, "r_x1": 286.365, "r_y1": 448.047, "r_x2": 286.365, "r_y2": 439.495, "r_x3": 50.112, "r_y3": 439.495, "coord_origin": "TOPLEFT"}, "text": "tables, all grid squares are associated with some table cell", "orig": "tables, all grid squares are associated with some table cell", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 460.002, "r_x1": 286.365, "r_y1": 460.002, "r_x2": 286.365, "r_y2": 451.45, "r_x3": 50.112, "r_y3": 451.45, "coord_origin": "TOPLEFT"}, "text": "and in the presence of table spans a cell extends across mul-", "orig": "and in the presence of table spans a cell extends across mul-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 471.957, "r_x1": 286.365, "r_y1": 471.957, "r_x2": 286.365, "r_y2": 463.405, "r_x3": 50.112, "r_y3": 463.405, "coord_origin": "TOPLEFT"}, "text": "tiple grid squares. When enough bounding boxes are known", "orig": "tiple grid squares. When enough bounding boxes are known", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 483.912, "r_x1": 143.76, "r_y1": 483.912, "r_x2": 143.76, "r_y2": 475.36, "r_x3": 50.112, "r_y3": 475.36, "coord_origin": "TOPLEFT"}, "text": "for a rectangular table,", "orig": "for a rectangular table,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 147.696, "r_y0": 483.912, "r_x1": 153.235, "r_y1": 483.912, "r_x2": 153.235, "r_y2": 475.36, "r_x3": 147.696, "r_y3": 475.36, "coord_origin": "TOPLEFT"}, "text": "it", "orig": "it", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 156.881, "r_y0": 483.912, "r_x1": 163.526, "r_y1": 483.912, "r_x2": 163.526, "r_y2": 475.36, "r_x3": 156.881, "r_y3": 475.36, "coord_origin": "TOPLEFT"}, "text": "is", "orig": "is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 167.173, "r_y0": 483.912, "r_x1": 286.365, "r_y1": 483.912, "r_x2": 286.365, "r_y2": 475.36, "r_x3": 167.173, "r_y3": 475.36, "coord_origin": "TOPLEFT"}, "text": "possible to compute the geo-", "orig": "possible to compute the geo-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 495.867, "r_x1": 286.365, "r_y1": 495.867, "r_x2": 286.365, "r_y2": 487.315, "r_x3": 50.112, "r_y3": 487.315, "coord_origin": "TOPLEFT"}, "text": "metrical border lines between the grid rows and columns.", "orig": "metrical border lines between the grid rows and columns.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 507.823, "r_x1": 286.365, "r_y1": 507.823, "r_x2": 286.365, "r_y2": 499.271, "r_x3": 50.112, "r_y3": 499.271, "coord_origin": "TOPLEFT"}, "text": "Eventually this information is used to generate the missing", "orig": "Eventually this information is used to generate the missing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 519.778, "r_x1": 286.365, "r_y1": 519.778, "r_x2": 286.365, "r_y2": 511.226, "r_x3": 50.112, "r_y3": 511.226, "coord_origin": "TOPLEFT"}, "text": "bounding boxes. Additionally, the existence of unused grid", "orig": "bounding boxes. Additionally, the existence of unused grid", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 531.733, "r_x1": 286.365, "r_y1": 531.733, "r_x2": 286.365, "r_y2": 523.181, "r_x3": 50.112, "r_y3": 523.181, "coord_origin": "TOPLEFT"}, "text": "squares indicates that the table rows have unequal number", "orig": "squares indicates that the table rows have unequal number", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 543.688, "r_x1": 286.365, "r_y1": 543.688, "r_x2": 286.365, "r_y2": 535.136, "r_x3": 50.112, "r_y3": 535.136, "coord_origin": "TOPLEFT"}, "text": "of columns and the overall structure is non-strict. The gen-", "orig": "of columns and the overall structure is non-strict. The gen-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 555.643, "r_x1": 286.365, "r_y1": 555.643, "r_x2": 286.365, "r_y2": 547.091, "r_x3": 50.112, "r_y3": 547.091, "coord_origin": "TOPLEFT"}, "text": "eration of missing bounding boxes for non-strict HTML ta-", "orig": "eration of missing bounding boxes for non-strict HTML ta-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 567.5989999999999, "r_x1": 257.474, "r_y1": 567.5989999999999, "r_x2": 257.474, "r_y2": 559.047, "r_x3": 50.112, "r_y3": 559.047, "coord_origin": "TOPLEFT"}, "text": "bles is ambiguous and therefore quite challenging.", "orig": "bles is ambiguous and therefore quite challenging.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 263.949, "r_y0": 567.5989999999999, "r_x1": 286.365, "r_y1": 567.5989999999999, "r_x2": 286.365, "r_y2": 559.047, "r_x3": 263.949, "r_y3": 559.047, "coord_origin": "TOPLEFT"}, "text": "Thus,", "orig": "Thus,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 48, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 579.554, "r_x1": 242.251, "r_y1": 579.554, "r_x2": 242.251, "r_y2": 571.002, "r_x3": 50.112, "r_y3": 571.002, "coord_origin": "TOPLEFT"}, "text": "we have decided to simply discard those tables.", "orig": "we have decided to simply discard those tables.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 49, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 246.714, "r_y0": 579.554, "r_x1": 286.365, "r_y1": 579.554, "r_x2": 286.365, "r_y2": 571.002, "r_x3": 246.714, "r_y3": 571.002, "coord_origin": "TOPLEFT"}, "text": "In case of", "orig": "In case of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 50, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 591.509, "r_x1": 286.365, "r_y1": 591.509, "r_x2": 286.365, "r_y2": 582.957, "r_x3": 50.112, "r_y3": 582.957, "coord_origin": "TOPLEFT"}, "text": "PubTabNet we have computed missing bounding boxes for", "orig": "PubTabNet we have computed missing bounding boxes for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 51, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 603.4639999999999, "r_x1": 286.365, "r_y1": 603.4639999999999, "r_x2": 286.365, "r_y2": 594.912, "r_x3": 50.112, "r_y3": 594.912, "coord_origin": "TOPLEFT"}, "text": "48% of the simple and 69% of the complex tables. Regard-", "orig": "48% of the simple and 69% of the complex tables. Regard-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 52, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 615.419, "r_x1": 286.365, "r_y1": 615.419, "r_x2": 286.365, "r_y2": 606.867, "r_x3": 50.112, "r_y3": 606.867, "coord_origin": "TOPLEFT"}, "text": "ing FinTabNet, 68% of the simple and 98% of the complex", "orig": "ing FinTabNet, 68% of the simple and 98% of the complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 53, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 627.374, "r_x1": 242.261, "r_y1": 627.374, "r_x2": 242.261, "r_y2": 618.822, "r_x3": 50.112, "r_y3": 618.822, "coord_origin": "TOPLEFT"}, "text": "tables require the generation of bounding boxes.", "orig": "tables require the generation of bounding boxes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 14, "label": "text", "bbox": {"l": 50.112, "t": 630.979, "r": 286.365, "b": 651.487, "coord_origin": "TOPLEFT"}, "confidence": 0.9335853457450867, "cells": [{"index": 54, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 639.531, "r_x1": 286.365, "r_y1": 639.531, "r_x2": 286.365, "r_y2": 630.979, "r_x3": 62.067, "r_y3": 630.979, "coord_origin": "TOPLEFT"}, "text": "Figure 7 illustrates the distribution of the tables across", "orig": "Figure 7 illustrates the distribution of the tables across", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 55, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 651.487, "r_x1": 179.905, "r_y1": 651.487, "r_x2": 179.905, "r_y2": 642.935, "r_x3": 50.112, "r_y3": 642.935, "coord_origin": "TOPLEFT"}, "text": "different dimensions per dataset.", "orig": "different dimensions per dataset.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 12, "label": "section_header", "bbox": {"l": 50.112, "t": 662.39, "r": 153.608, "b": 672.242, "coord_origin": "TOPLEFT"}, "confidence": 0.9515743255615234, "cells": [{"index": 56, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 672.242, "r_x1": 153.608, "r_y1": 672.242, "r_x2": 153.608, "r_y2": 662.39, "r_x3": 50.112, "r_y3": 662.39, "coord_origin": "TOPLEFT"}, "text": "1.2. Synthetic datasets", "orig": "1.2. Synthetic datasets", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 3, "label": "text", "bbox": {"l": 50.112, "t": 681.6, "r": 286.365, "b": 714.062, "coord_origin": "TOPLEFT"}, "confidence": 0.9783332347869873, "cells": [{"index": 57, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 690.152, "r_x1": 286.365, "r_y1": 690.152, "r_x2": 286.365, "r_y2": 681.6, "r_x3": 62.067, "r_y3": 681.6, "coord_origin": "TOPLEFT"}, "text": "Aiming to train and evaluate our models in a broader", "orig": "Aiming to train and evaluate our models in a broader", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 58, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 702.107, "r_x1": 286.365, "r_y1": 702.107, "r_x2": 286.365, "r_y2": 693.5550000000001, "r_x3": 50.112, "r_y3": 693.5550000000001, "coord_origin": "TOPLEFT"}, "text": "spectrum of table data we have synthesized four types of", "orig": "spectrum of table data we have synthesized four types of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 59, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 714.062, "r_x1": 84.144, "r_y1": 714.062, "r_x2": 84.144, "r_y2": 705.51, "r_x3": 50.112, "r_y3": 705.51, "coord_origin": "TOPLEFT"}, "text": "datasets.", "orig": "datasets.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 60, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 91.238, "r_y0": 714.062, "r_x1": 286.365, "r_y1": 714.062, "r_x2": 286.365, "r_y2": 705.51, "r_x3": 91.238, "r_y3": 705.51, "coord_origin": "TOPLEFT"}, "text": "Each one contains tables with different appear-", "orig": "Each one contains tables with different appear-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 8, "label": "text", "bbox": {"l": 308.862, "t": 162.92399999999998, "r": 545.115, "b": 207.34199999999998, "coord_origin": "TOPLEFT"}, "confidence": 0.9596064686775208, "cells": [{"index": 61, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 171.476, "r_x1": 426.929, "r_y1": 171.476, "r_x2": 426.929, "r_y2": 162.92399999999998, "r_x3": 308.862, "r_y3": 162.92399999999998, "coord_origin": "TOPLEFT"}, "text": "ances in regard to their size,", "orig": "ances in regard to their size,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 62, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 431.043, "r_y0": 171.476, "r_x1": 468.393, "r_y1": 171.476, "r_x2": 468.393, "r_y2": 162.92399999999998, "r_x3": 431.043, "r_y3": 162.92399999999998, "coord_origin": "TOPLEFT"}, "text": "structure,", "orig": "structure,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 63, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 472.508, "r_y0": 171.476, "r_x1": 491.327, "r_y1": 171.476, "r_x2": 491.327, "r_y2": 162.92399999999998, "r_x3": 472.508, "r_y3": 162.92399999999998, "coord_origin": "TOPLEFT"}, "text": "style", "orig": "style", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 64, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 495.113, "r_y0": 171.476, "r_x1": 545.115, "r_y1": 171.476, "r_x2": 545.115, "r_y2": 162.92399999999998, "r_x3": 495.113, "r_y3": 162.92399999999998, "coord_origin": "TOPLEFT"}, "text": "and content.", "orig": "and content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 65, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 183.43100000000004, "r_x1": 545.115, "r_y1": 183.43100000000004, "r_x2": 545.115, "r_y2": 174.87900000000002, "r_x3": 308.862, "r_y3": 174.87900000000002, "coord_origin": "TOPLEFT"}, "text": "Every synthetic dataset contains 150k examples, summing", "orig": "Every synthetic dataset contains 150k examples, summing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 66, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 195.38599999999997, "r_x1": 545.115, "r_y1": 195.38599999999997, "r_x2": 545.115, "r_y2": 186.83399999999995, "r_x3": 308.862, "r_y3": 186.83399999999995, "coord_origin": "TOPLEFT"}, "text": "up to 600k synthetic examples. All datasets are divided into", "orig": "up to 600k synthetic examples. All datasets are divided into", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 67, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 207.34199999999998, "r_x1": 484.074, "r_y1": 207.34199999999998, "r_x2": 484.074, "r_y2": 198.78999999999996, "r_x3": 308.862, "r_y3": 198.78999999999996, "coord_origin": "TOPLEFT"}, "text": "Train, Test and Val splits (80%, 10%, 10%).", "orig": "Train, Test and Val splits (80%, 10%, 10%).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 15, "label": "text", "bbox": {"l": 308.862, "t": 211.50400000000002, "r": 545.115, "b": 232.01099999999997, "coord_origin": "TOPLEFT"}, "confidence": 0.9261796474456787, "cells": [{"index": 68, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 220.05600000000004, "r_x1": 545.115, "r_y1": 220.05600000000004, "r_x2": 545.115, "r_y2": 211.50400000000002, "r_x3": 320.817, "r_y3": 211.50400000000002, "coord_origin": "TOPLEFT"}, "text": "The process of generating a synthetic dataset can be de-", "orig": "The process of generating a synthetic dataset can be de-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 69, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 232.01099999999997, "r_x1": 448.089, "r_y1": 232.01099999999997, "r_x2": 448.089, "r_y2": 223.45899999999995, "r_x3": 308.862, "r_y3": 223.45899999999995, "coord_origin": "TOPLEFT"}, "text": "composed into the following steps:", "orig": "composed into the following steps:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 7, "label": "list_item", "bbox": {"l": 308.862, "t": 236.17399999999998, "r": 545.115, "b": 316.457, "coord_origin": "TOPLEFT"}, "confidence": 0.9642952680587769, "cells": [{"index": 70, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 244.726, "r_x1": 328.289, "r_y1": 244.726, "r_x2": 328.289, "r_y2": 236.17399999999998, "r_x3": 320.817, "r_y3": 236.17399999999998, "coord_origin": "TOPLEFT"}, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 71, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 335.382, "r_y0": 244.726, "r_x1": 492.911, "r_y1": 244.726, "r_x2": 492.911, "r_y2": 236.17399999999998, "r_x3": 335.382, "r_y3": 236.17399999999998, "coord_origin": "TOPLEFT"}, "text": "Prepare styling and content templates:", "orig": "Prepare styling and content templates:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 72, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 498.669, "r_y0": 244.726, "r_x1": 545.115, "r_y1": 244.726, "r_x2": 545.115, "r_y2": 236.17399999999998, "r_x3": 498.669, "r_y3": 236.17399999999998, "coord_origin": "TOPLEFT"}, "text": "The styling", "orig": "The styling", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 73, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 256.68100000000004, "r_x1": 545.115, "r_y1": 256.68100000000004, "r_x2": 545.115, "r_y2": 248.12900000000002, "r_x3": 308.862, "r_y3": 248.12900000000002, "coord_origin": "TOPLEFT"}, "text": "templates have been manually designed and organized into", "orig": "templates have been manually designed and organized into", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 74, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 268.63599999999997, "r_x1": 481.733, "r_y1": 268.63599999999997, "r_x2": 481.733, "r_y2": 260.08399999999995, "r_x3": 308.862, "r_y3": 260.08399999999995, "coord_origin": "TOPLEFT"}, "text": "groups of scope specific appearances (e.g.", "orig": "groups of scope specific appearances (e.g.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 75, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 488.119, "r_y0": 268.63599999999997, "r_x1": 545.115, "r_y1": 268.63599999999997, "r_x2": 545.115, "r_y2": 260.08399999999995, "r_x3": 488.119, "r_y3": 260.08399999999995, "coord_origin": "TOPLEFT"}, "text": "financial data,", "orig": "financial data,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 76, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 280.591, "r_x1": 393.385, "r_y1": 280.591, "r_x2": 393.385, "r_y2": 272.039, "r_x3": 308.862, "r_y3": 272.039, "coord_origin": "TOPLEFT"}, "text": "marketing data, etc.)", "orig": "marketing data, etc.)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 77, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 400.119, "r_y0": 280.591, "r_x1": 545.115, "r_y1": 280.591, "r_x2": 545.115, "r_y2": 272.039, "r_x3": 400.119, "r_y3": 272.039, "coord_origin": "TOPLEFT"}, "text": "Additionally, we have prepared cu-", "orig": "Additionally, we have prepared cu-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 78, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 292.546, "r_x1": 545.115, "r_y1": 292.546, "r_x2": 545.115, "r_y2": 283.994, "r_x3": 308.862, "r_y3": 283.994, "coord_origin": "TOPLEFT"}, "text": "rated collections of content templates by extracting the most", "orig": "rated collections of content templates by extracting the most", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 79, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 304.502, "r_x1": 349.808, "r_y1": 304.502, "r_x2": 349.808, "r_y2": 295.95, "r_x3": 308.862, "r_y3": 295.95, "coord_origin": "TOPLEFT"}, "text": "frequently", "orig": "frequently", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 80, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 354.152, "r_y0": 304.502, "r_x1": 487.183, "r_y1": 304.502, "r_x2": 487.183, "r_y2": 295.95, "r_x3": 354.152, "r_y3": 295.95, "coord_origin": "TOPLEFT"}, "text": "used terms out of non-synthetic", "orig": "used terms out of non-synthetic", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 81, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 491.526, "r_y0": 304.502, "r_x1": 523.068, "r_y1": 304.502, "r_x2": 523.068, "r_y2": 295.95, "r_x3": 491.526, "r_y3": 295.95, "coord_origin": "TOPLEFT"}, "text": "datasets", "orig": "datasets", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 82, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 527.412, "r_y0": 304.502, "r_x1": 545.115, "r_y1": 304.502, "r_x2": 545.115, "r_y2": 295.95, "r_x3": 527.412, "r_y3": 295.95, "coord_origin": "TOPLEFT"}, "text": "(e.g.", "orig": "(e.g.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 83, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 316.457, "r_x1": 425.693, "r_y1": 316.457, "r_x2": 425.693, "r_y2": 307.905, "r_x3": 308.862, "r_y3": 307.905, "coord_origin": "TOPLEFT"}, "text": "PubTabNet, FinTabNet, etc.).", "orig": "PubTabNet, FinTabNet, etc.).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 6, "label": "list_item", "bbox": {"l": 308.862, "t": 320.619, "r": 545.115, "b": 448.723, "coord_origin": "TOPLEFT"}, "confidence": 0.9699994921684265, "cells": [{"index": 84, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 329.171, "r_x1": 328.289, "r_y1": 329.171, "r_x2": 328.289, "r_y2": 320.619, "r_x3": 320.817, "r_y3": 320.619, "coord_origin": "TOPLEFT"}, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 85, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 332.692, "r_y0": 329.171, "r_x1": 435.377, "r_y1": 329.171, "r_x2": 435.377, "r_y2": 320.619, "r_x3": 332.692, "r_y3": 320.619, "coord_origin": "TOPLEFT"}, "text": "Generate table structures:", "orig": "Generate table structures:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 86, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 439.342, "r_y0": 329.171, "r_x1": 545.115, "r_y1": 329.171, "r_x2": 545.115, "r_y2": 320.619, "r_x3": 439.342, "r_y3": 320.619, "coord_origin": "TOPLEFT"}, "text": "The structure of each syn-", "orig": "The structure of each syn-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 87, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 341.126, "r_x1": 545.115, "r_y1": 341.126, "r_x2": 545.115, "r_y2": 332.574, "r_x3": 308.862, "r_y3": 332.574, "coord_origin": "TOPLEFT"}, "text": "thetic dataset assumes a horizontal table header which po-", "orig": "thetic dataset assumes a horizontal table header which po-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 88, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 353.081, "r_x1": 341.519, "r_y1": 353.081, "r_x2": 341.519, "r_y2": 344.529, "r_x3": 308.862, "r_y3": 344.529, "coord_origin": "TOPLEFT"}, "text": "tentially", "orig": "tentially", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 89, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 345.813, "r_y0": 353.081, "r_x1": 427.168, "r_y1": 353.081, "r_x2": 427.168, "r_y2": 344.529, "r_x3": 345.813, "r_y3": 344.529, "coord_origin": "TOPLEFT"}, "text": "spans over multiple", "orig": "spans over multiple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 90, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 431.462, "r_y0": 353.081, "r_x1": 545.115, "r_y1": 353.081, "r_x2": 545.115, "r_y2": 344.529, "r_x3": 431.462, "r_y3": 344.529, "coord_origin": "TOPLEFT"}, "text": "rows and a table body that", "orig": "rows and a table body that", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 91, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 365.037, "r_x1": 545.115, "r_y1": 365.037, "r_x2": 545.115, "r_y2": 356.485, "r_x3": 308.862, "r_y3": 356.485, "coord_origin": "TOPLEFT"}, "text": "may contain a combination of row spans and column spans.", "orig": "may contain a combination of row spans and column spans.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 92, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 376.992, "r_x1": 545.115, "r_y1": 376.992, "r_x2": 545.115, "r_y2": 368.44, "r_x3": 308.862, "r_y3": 368.44, "coord_origin": "TOPLEFT"}, "text": "However, spans are not allowed to cross the header - body", "orig": "However, spans are not allowed to cross the header - body", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 93, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 388.947, "r_x1": 348.334, "r_y1": 388.947, "r_x2": 348.334, "r_y2": 380.395, "r_x3": 308.862, "r_y3": 380.395, "coord_origin": "TOPLEFT"}, "text": "boundary.", "orig": "boundary.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 94, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 353.504, "r_y0": 388.947, "r_x1": 545.115, "r_y1": 388.947, "r_x2": 545.115, "r_y2": 380.395, "r_x3": 353.504, "r_y3": 380.395, "coord_origin": "TOPLEFT"}, "text": "The table structure is described by the parame-", "orig": "The table structure is described by the parame-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 95, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 400.902, "r_x1": 326.018, "r_y1": 400.902, "r_x2": 326.018, "r_y2": 392.35, "r_x3": 308.862, "r_y3": 392.35, "coord_origin": "TOPLEFT"}, "text": "ters:", "orig": "ters:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 96, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 330.909, "r_y0": 400.902, "r_x1": 545.115, "r_y1": 400.902, "r_x2": 545.115, "r_y2": 392.35, "r_x3": 330.909, "r_y3": 392.35, "coord_origin": "TOPLEFT"}, "text": "Total number of table rows and columns, number of", "orig": "Total number of table rows and columns, number of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 97, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 412.857, "r_x1": 545.115, "r_y1": 412.857, "r_x2": 545.115, "r_y2": 404.305, "r_x3": 308.862, "r_y3": 404.305, "coord_origin": "TOPLEFT"}, "text": "header rows, type of spans (header only spans, row only", "orig": "header rows, type of spans (header only spans, row only", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 98, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 424.812, "r_x1": 333.49, "r_y1": 424.812, "r_x2": 333.49, "r_y2": 416.26, "r_x3": 308.862, "r_y3": 416.26, "coord_origin": "TOPLEFT"}, "text": "spans,", "orig": "spans,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 99, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 338.082, "r_y0": 424.812, "r_x1": 418.66, "r_y1": 424.812, "r_x2": 418.66, "r_y2": 416.26, "r_x3": 338.082, "r_y3": 416.26, "coord_origin": "TOPLEFT"}, "text": "column only spans,", "orig": "column only spans,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 100, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 423.253, "r_y0": 424.812, "r_x1": 545.115, "r_y1": 424.812, "r_x2": 545.115, "r_y2": 416.26, "r_x3": 423.253, "r_y3": 416.26, "coord_origin": "TOPLEFT"}, "text": "both row and column spans),", "orig": "both row and column spans),", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 101, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 436.768, "r_x1": 545.115, "r_y1": 436.768, "r_x2": 545.115, "r_y2": 428.216, "r_x3": 308.862, "r_y3": 428.216, "coord_origin": "TOPLEFT"}, "text": "maximum span size and the ratio of the table area covered", "orig": "maximum span size and the ratio of the table area covered", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 102, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 448.723, "r_x1": 345.943, "r_y1": 448.723, "r_x2": 345.943, "r_y2": 440.171, "r_x3": 308.862, "r_y3": 440.171, "coord_origin": "TOPLEFT"}, "text": "by spans.", "orig": "by spans.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 9, "label": "list_item", "bbox": {"l": 308.862, "t": 452.706, "r": 545.115, "b": 497.303, "coord_origin": "TOPLEFT"}, "confidence": 0.9568928480148315, "cells": [{"index": 103, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 461.437, "r_x1": 485.758, "r_y1": 461.437, "r_x2": 485.758, "r_y2": 452.885, "r_x3": 320.817, "r_y3": 452.885, "coord_origin": "TOPLEFT"}, "text": "3. Generate content: Based on the dataset", "orig": "3. Generate content: Based on the dataset", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 104, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 488.073, "r_y0": 461.294, "r_x1": 511.864, "r_y1": 461.294, "r_x2": 511.864, "r_y2": 452.706, "r_x3": 488.073, "r_y3": 452.706, "coord_origin": "TOPLEFT"}, "text": "theme", "orig": "theme", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 105, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 511.863, "r_y0": 461.437, "r_x1": 545.108, "r_y1": 461.437, "r_x2": 545.108, "r_y2": 452.885, "r_x3": 511.863, "r_y3": 452.885, "coord_origin": "TOPLEFT"}, "text": ", a set of", "orig": ", a set of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 106, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 473.392, "r_x1": 545.115, "r_y1": 473.392, "r_x2": 545.115, "r_y2": 464.84, "r_x3": 308.862, "r_y3": 464.84, "coord_origin": "TOPLEFT"}, "text": "suitable content templates is chosen first. Then, this content", "orig": "suitable content templates is chosen first. Then, this content", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 107, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 485.348, "r_x1": 545.115, "r_y1": 485.348, "r_x2": 545.115, "r_y2": 476.796, "r_x3": 308.862, "r_y3": 476.796, "coord_origin": "TOPLEFT"}, "text": "can be combined with purely random text to produce the", "orig": "can be combined with purely random text to produce the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 108, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 497.303, "r_x1": 379.148, "r_y1": 497.303, "r_x2": 379.148, "r_y2": 488.751, "r_x3": 308.862, "r_y3": 488.751, "coord_origin": "TOPLEFT"}, "text": "synthetic content.", "orig": "synthetic content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 5, "label": "list_item", "bbox": {"l": 308.862, "t": 501.465, "r": 545.115, "b": 545.883, "coord_origin": "TOPLEFT"}, "confidence": 0.9710659980773926, "cells": [{"index": 109, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 510.017, "r_x1": 328.289, "r_y1": 510.017, "r_x2": 328.289, "r_y2": 501.465, "r_x3": 320.817, "r_y3": 501.465, "coord_origin": "TOPLEFT"}, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 110, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 334.217, "r_y0": 510.017, "r_x1": 434.082, "r_y1": 510.017, "r_x2": 434.082, "r_y2": 501.465, "r_x3": 334.217, "r_y3": 501.465, "coord_origin": "TOPLEFT"}, "text": "Apply styling templates:", "orig": "Apply styling templates:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 111, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 439.063, "r_y0": 510.017, "r_x1": 545.115, "r_y1": 510.017, "r_x2": 545.115, "r_y2": 501.465, "r_x3": 439.063, "r_y3": 501.465, "coord_origin": "TOPLEFT"}, "text": "Depending on the domain", "orig": "Depending on the domain", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 112, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 521.972, "r_x1": 406.884, "r_y1": 521.972, "r_x2": 406.884, "r_y2": 513.4200000000001, "r_x3": 308.862, "r_y3": 513.4200000000001, "coord_origin": "TOPLEFT"}, "text": "of the synthetic dataset,", "orig": "of the synthetic dataset,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 113, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 411.019, "r_y0": 521.972, "r_x1": 545.115, "r_y1": 521.972, "r_x2": 545.115, "r_y2": 513.4200000000001, "r_x3": 411.019, "r_y3": 513.4200000000001, "coord_origin": "TOPLEFT"}, "text": "a set of styling templates is first", "orig": "a set of styling templates is first", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 114, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 533.928, "r_x1": 384.299, "r_y1": 533.928, "r_x2": 384.299, "r_y2": 525.376, "r_x3": 308.862, "r_y3": 525.376, "coord_origin": "TOPLEFT"}, "text": "manually selected.", "orig": "manually selected.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 115, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 391.253, "r_y0": 533.928, "r_x1": 545.115, "r_y1": 533.928, "r_x2": 545.115, "r_y2": 525.376, "r_x3": 391.253, "r_y3": 525.376, "coord_origin": "TOPLEFT"}, "text": "Then, a style is randomly selected to", "orig": "Then, a style is randomly selected to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 116, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 545.883, "r_x1": 496.159, "r_y1": 545.883, "r_x2": 496.159, "r_y2": 537.331, "r_x3": 308.862, "r_y3": 537.331, "coord_origin": "TOPLEFT"}, "text": "format the appearance of the synthesized table.", "orig": "format the appearance of the synthesized table.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 4, "label": "list_item", "bbox": {"l": 308.862, "t": 550.045, "r": 545.115, "b": 606.418, "coord_origin": "TOPLEFT"}, "confidence": 0.9778757095336914, "cells": [{"index": 117, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 558.597, "r_x1": 328.289, "r_y1": 558.597, "r_x2": 328.289, "r_y2": 550.045, "r_x3": 320.817, "r_y3": 550.045, "coord_origin": "TOPLEFT"}, "text": "5.", "orig": "5.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 118, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 335.402, "r_y0": 558.597, "r_x1": 450.371, "r_y1": 558.597, "r_x2": 450.371, "r_y2": 550.045, "r_x3": 335.402, "r_y3": 550.045, "coord_origin": "TOPLEFT"}, "text": "Render the complete tables:", "orig": "Render the complete tables:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 119, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 456.139, "r_y0": 558.597, "r_x1": 545.115, "r_y1": 558.597, "r_x2": 545.115, "r_y2": 550.045, "r_x3": 456.139, "r_y3": 550.045, "coord_origin": "TOPLEFT"}, "text": "The synthetic table is", "orig": "The synthetic table is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 120, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 570.552, "r_x1": 334.326, "r_y1": 570.552, "r_x2": 334.326, "r_y2": 562.0, "r_x3": 308.862, "r_y3": 562.0, "coord_origin": "TOPLEFT"}, "text": "finally", "orig": "finally", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 121, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 337.983, "r_y0": 570.552, "r_x1": 545.115, "r_y1": 570.552, "r_x2": 545.115, "r_y2": 562.0, "r_x3": 337.983, "r_y3": 562.0, "coord_origin": "TOPLEFT"}, "text": "rendered by a web browser engine to generate the", "orig": "rendered by a web browser engine to generate the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 122, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 582.5070000000001, "r_x1": 545.115, "r_y1": 582.5070000000001, "r_x2": 545.115, "r_y2": 573.955, "r_x3": 308.862, "r_y3": 573.955, "coord_origin": "TOPLEFT"}, "text": "bounding boxes for each table cell. A batching technique is", "orig": "bounding boxes for each table cell. A batching technique is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 123, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 594.463, "r_x1": 545.115, "r_y1": 594.463, "r_x2": 545.115, "r_y2": 585.9110000000001, "r_x3": 308.862, "r_y3": 585.9110000000001, "coord_origin": "TOPLEFT"}, "text": "utilized to optimize the runtime overhead of the rendering", "orig": "utilized to optimize the runtime overhead of the rendering", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 124, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 606.418, "r_x1": 341.23, "r_y1": 606.418, "r_x2": 341.23, "r_y2": 597.866, "r_x3": 308.862, "r_y3": 597.866, "coord_origin": "TOPLEFT"}, "text": "process.", "orig": "process.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 10, "label": "section_header", "bbox": {"l": 308.862, "t": 622.2909999999999, "r": 545.109, "b": 646.987, "coord_origin": "TOPLEFT"}, "confidence": 0.954940915107727, "cells": [{"index": 125, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 633.039, "r_x1": 317.828, "r_y1": 633.039, "r_x2": 317.828, "r_y2": 622.2909999999999, "r_x3": 308.862, "r_y3": 622.2909999999999, "coord_origin": "TOPLEFT"}, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 126, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 323.591, "r_y0": 633.039, "r_x1": 376.493, "r_y1": 633.039, "r_x2": 376.493, "r_y2": 622.2909999999999, "r_x3": 323.591, "r_y3": 622.2909999999999, "coord_origin": "TOPLEFT"}, "text": "Prediction", "orig": "Prediction", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 127, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 382.255, "r_y0": 633.039, "r_x1": 461.076, "r_y1": 633.039, "r_x2": 461.076, "r_y2": 622.2909999999999, "r_x3": 382.255, "r_y3": 622.2909999999999, "coord_origin": "TOPLEFT"}, "text": "post-processing", "orig": "post-processing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 128, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 466.826, "r_y0": 633.039, "r_x1": 481.794, "r_y1": 633.039, "r_x2": 481.794, "r_y2": 622.2909999999999, "r_x3": 466.826, "r_y3": 622.2909999999999, "coord_origin": "TOPLEFT"}, "text": "for", "orig": "for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 129, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 487.556, "r_y0": 633.039, "r_x1": 545.109, "r_y1": 633.039, "r_x2": 545.109, "r_y2": 622.2909999999999, "r_x3": 487.556, "r_y3": 622.2909999999999, "coord_origin": "TOPLEFT"}, "text": "PDF docu-", "orig": "PDF docu-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 130, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 326.795, "r_y0": 646.987, "r_x1": 357.341, "r_y1": 646.987, "r_x2": 357.341, "r_y2": 636.239, "r_x3": 326.795, "r_y3": 636.239, "coord_origin": "TOPLEFT"}, "text": "ments", "orig": "ments", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 1, "label": "text", "bbox": {"l": 308.862, "t": 657.69, "r": 545.115, "b": 714.063, "coord_origin": "TOPLEFT"}, "confidence": 0.9829329252243042, "cells": [{"index": 131, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 666.242, "r_x1": 545.115, "r_y1": 666.242, "r_x2": 545.115, "r_y2": 657.69, "r_x3": 320.817, "r_y3": 657.69, "coord_origin": "TOPLEFT"}, "text": "Although TableFormer can predict the table structure and", "orig": "Although TableFormer can predict the table structure and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 132, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 678.197, "r_x1": 545.115, "r_y1": 678.197, "r_x2": 545.115, "r_y2": 669.645, "r_x3": 308.862, "r_y3": 669.645, "coord_origin": "TOPLEFT"}, "text": "the bounding boxes for tables recognized inside PDF docu-", "orig": "the bounding boxes for tables recognized inside PDF docu-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 133, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 690.152, "r_x1": 545.115, "r_y1": 690.152, "r_x2": 545.115, "r_y2": 681.6, "r_x3": 308.862, "r_y3": 681.6, "coord_origin": "TOPLEFT"}, "text": "ments, this is not enough when a full reconstruction of the", "orig": "ments, this is not enough when a full reconstruction of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 134, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 702.107, "r_x1": 545.115, "r_y1": 702.107, "r_x2": 545.115, "r_y2": 693.5550000000001, "r_x3": 308.862, "r_y3": 693.5550000000001, "coord_origin": "TOPLEFT"}, "text": "original table is required. This happens mainly due the fol-", "orig": "original table is required. This happens mainly due the fol-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 135, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 714.063, "r_x1": 371.427, "r_y1": 714.063, "r_x2": 371.427, "r_y2": 705.511, "r_x3": 308.862, "r_y3": 705.511, "coord_origin": "TOPLEFT"}, "text": "lowing reasons:", "orig": "lowing reasons:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 16, "label": "page_footer", "bbox": {"l": 292.631, "t": 734.402, "r": 302.594, "b": 742.954, "coord_origin": "TOPLEFT"}, "confidence": 0.8986663222312927, "cells": [{"index": 136, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 292.631, "r_y0": 742.954, "r_x1": 302.594, "r_y1": 742.954, "r_x2": 302.594, "r_y2": 734.402, "r_x3": 292.631, "r_y3": 734.402, "coord_origin": "TOPLEFT"}, "text": "11", "orig": "11", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}]}, "tablestructure": {"table_map": {}}, "figures_classification": null, "equations_prediction": null, "vlm_response": null}, "assembled": {"elements": [{"label": "section_header", "id": 18, "page_no": 10, "cluster": {"id": 18, "label": "section_header", "bbox": {"l": 132.842, "t": 110.57500000000005, "r": 465.376, "b": 135.48400000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.6497084498405457, "cells": [{"index": 0, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 132.842, "r_y0": 121.32299999999998, "r_x1": 465.376, "r_y1": 121.32299999999998, "r_x2": 465.376, "r_y2": 110.57500000000005, "r_x3": 132.842, "r_y3": 110.57500000000005, "coord_origin": "TOPLEFT"}, "text": "TableFormer: Table Structure Understanding with Transformers", "orig": "TableFormer: Table Structure Understanding with Transformers", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 220.184, "r_y0": 135.48400000000004, "r_x1": 375.043, "r_y1": 135.48400000000004, "r_x2": 375.043, "r_y2": 122.42399999999998, "r_x3": 220.184, "r_y3": 122.42399999999998, "coord_origin": "TOPLEFT"}, "text": "Supplementary Material", "orig": "Supplementary Material", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "TableFormer: Table Structure Understanding with Transformers Supplementary Material"}, {"label": "section_header", "id": 13, "page_no": 10, "cluster": {"id": 13, "label": "section_header", "bbox": {"l": 50.112, "t": 161.16099999999994, "r": 175.964, "b": 171.909, "coord_origin": "TOPLEFT"}, "confidence": 0.9454860091209412, "cells": [{"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 171.909, "r_x1": 175.964, "r_y1": 171.909, "r_x2": 175.964, "r_y2": 161.16099999999994, "r_x3": 50.112, "r_y3": 161.16099999999994, "coord_origin": "TOPLEFT"}, "text": "1. Details on the datasets", "orig": "1. Details on the datasets", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "1. Details on the datasets"}, {"label": "section_header", "id": 11, "page_no": 10, "cluster": {"id": 11, "label": "section_header", "bbox": {"l": 50.112, "t": 180.97900000000004, "r": 150.364, "b": 190.83100000000002, "coord_origin": "TOPLEFT"}, "confidence": 0.9535645842552185, "cells": [{"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 190.83100000000002, "r_x1": 150.364, "r_y1": 190.83100000000002, "r_x2": 150.364, "r_y2": 180.97900000000004, "r_x3": 50.112, "r_y3": 180.97900000000004, "coord_origin": "TOPLEFT"}, "text": "1.1. Data preparation", "orig": "1.1. Data preparation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "1.1. Data preparation"}, {"label": "text", "id": 0, "page_no": 10, "cluster": {"id": 0, "label": "text", "bbox": {"l": 50.112, "t": 200.18899999999996, "r": 286.365, "b": 388.069, "coord_origin": "TOPLEFT"}, "confidence": 0.9864971041679382, "cells": [{"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 208.74099999999999, "r_x1": 286.365, "r_y1": 208.74099999999999, "r_x2": 286.365, "r_y2": 200.18899999999996, "r_x3": 62.067, "r_y3": 200.18899999999996, "coord_origin": "TOPLEFT"}, "text": "As a first step of our data preparation process, we have", "orig": "As a first step of our data preparation process, we have", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 220.697, "r_x1": 286.365, "r_y1": 220.697, "r_x2": 286.365, "r_y2": 212.14499999999998, "r_x3": 50.112, "r_y3": 212.14499999999998, "coord_origin": "TOPLEFT"}, "text": "calculated statistics over the datasets across the following", "orig": "calculated statistics over the datasets across the following", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 232.65200000000004, "r_x1": 286.365, "r_y1": 232.65200000000004, "r_x2": 286.365, "r_y2": 224.10000000000002, "r_x3": 50.112, "r_y3": 224.10000000000002, "coord_origin": "TOPLEFT"}, "text": "dimensions: (1) table size measured in the number of rows", "orig": "dimensions: (1) table size measured in the number of rows", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 244.60699999999997, "r_x1": 286.365, "r_y1": 244.60699999999997, "r_x2": 286.365, "r_y2": 236.05499999999995, "r_x3": 50.112, "r_y3": 236.05499999999995, "coord_origin": "TOPLEFT"}, "text": "and columns, (2) complexity of the table, (3) strictness of", "orig": "and columns, (2) complexity of the table, (3) strictness of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 256.562, "r_x1": 286.365, "r_y1": 256.562, "r_x2": 286.365, "r_y2": 248.01, "r_x3": 50.112, "r_y3": 248.01, "coord_origin": "TOPLEFT"}, "text": "the provided HTML structure and (4) completeness (i.e. no", "orig": "the provided HTML structure and (4) completeness (i.e. no", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 268.51700000000005, "r_x1": 286.365, "r_y1": 268.51700000000005, "r_x2": 286.365, "r_y2": 259.96500000000003, "r_x3": 50.112, "r_y3": 259.96500000000003, "coord_origin": "TOPLEFT"}, "text": "omitted bounding boxes). Atable is considered to be simple", "orig": "omitted bounding boxes). Atable is considered to be simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 280.472, "r_x1": 286.365, "r_y1": 280.472, "r_x2": 286.365, "r_y2": 271.91999999999996, "r_x3": 50.112, "r_y3": 271.91999999999996, "coord_origin": "TOPLEFT"}, "text": "if it does not contain row spans or column spans. Addition-", "orig": "if it does not contain row spans or column spans. Addition-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 292.428, "r_x1": 286.365, "r_y1": 292.428, "r_x2": 286.365, "r_y2": 283.876, "r_x3": 50.112, "r_y3": 283.876, "coord_origin": "TOPLEFT"}, "text": "ally, a table has a strict HTMLstructure if every row has the", "orig": "ally, a table has a strict HTMLstructure if every row has the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 304.383, "r_x1": 286.365, "r_y1": 304.383, "r_x2": 286.365, "r_y2": 295.831, "r_x3": 50.112, "r_y3": 295.831, "coord_origin": "TOPLEFT"}, "text": "same number of columns after taking into account any row", "orig": "same number of columns after taking into account any row", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 316.338, "r_x1": 118.834, "r_y1": 316.338, "r_x2": 118.834, "r_y2": 307.786, "r_x3": 50.112, "r_y3": 307.786, "coord_origin": "TOPLEFT"}, "text": "or column spans.", "orig": "or column spans.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 123.307, "r_y0": 316.338, "r_x1": 286.365, "r_y1": 316.338, "r_x2": 286.365, "r_y2": 307.786, "r_x3": 123.307, "r_y3": 307.786, "coord_origin": "TOPLEFT"}, "text": "Therefore a strict HTML structure looks", "orig": "Therefore a strict HTML structure looks", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 328.293, "r_x1": 127.163, "r_y1": 328.293, "r_x2": 127.163, "r_y2": 319.741, "r_x3": 50.112, "r_y3": 319.741, "coord_origin": "TOPLEFT"}, "text": "always rectangular.", "orig": "always rectangular.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 131.257, "r_y0": 328.293, "r_x1": 286.365, "r_y1": 328.293, "r_x2": 286.365, "r_y2": 319.741, "r_x3": 131.257, "r_y3": 319.741, "coord_origin": "TOPLEFT"}, "text": "However, HTML is a lenient encoding", "orig": "However, HTML is a lenient encoding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 340.248, "r_x1": 95.163, "r_y1": 340.248, "r_x2": 95.163, "r_y2": 331.696, "r_x3": 50.112, "r_y3": 331.696, "coord_origin": "TOPLEFT"}, "text": "format, i.e.", "orig": "format, i.e.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 101.459, "r_y0": 340.248, "r_x1": 286.365, "r_y1": 340.248, "r_x2": 286.365, "r_y2": 331.696, "r_x3": 101.459, "r_y3": 331.696, "coord_origin": "TOPLEFT"}, "text": "tables with rows of different sizes might still", "orig": "tables with rows of different sizes might still", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 19, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 352.204, "r_x1": 257.942, "r_y1": 352.204, "r_x2": 257.942, "r_y2": 343.652, "r_x3": 50.112, "r_y3": 343.652, "coord_origin": "TOPLEFT"}, "text": "be regarded as correct due to implicit display rules.", "orig": "be regarded as correct due to implicit display rules.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 20, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 262.574, "r_y0": 352.204, "r_x1": 286.365, "r_y1": 352.204, "r_x2": 286.365, "r_y2": 343.652, "r_x3": 262.574, "r_y3": 343.652, "coord_origin": "TOPLEFT"}, "text": "These", "orig": "These", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 21, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 364.159, "r_x1": 286.365, "r_y1": 364.159, "r_x2": 286.365, "r_y2": 355.607, "r_x3": 50.112, "r_y3": 355.607, "coord_origin": "TOPLEFT"}, "text": "implicit rules leave room for ambiguity, which we want to", "orig": "implicit rules leave room for ambiguity, which we want to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 22, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 376.114, "r_x1": 286.365, "r_y1": 376.114, "r_x2": 286.365, "r_y2": 367.562, "r_x3": 50.112, "r_y3": 367.562, "coord_origin": "TOPLEFT"}, "text": "avoid. As such, we prefer to have 'strict' tables, i.e. tables", "orig": "avoid. As such, we prefer to have 'strict' tables, i.e. tables", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 23, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 388.069, "r_x1": 230.804, "r_y1": 388.069, "r_x2": 230.804, "r_y2": 379.517, "r_x3": 50.112, "r_y3": 379.517, "coord_origin": "TOPLEFT"}, "text": "where every row has exactly the same length.", "orig": "where every row has exactly the same length.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "As a first step of our data preparation process, we have calculated statistics over the datasets across the following dimensions: (1) table size measured in the number of rows and columns, (2) complexity of the table, (3) strictness of the provided HTML structure and (4) completeness (i.e. no omitted bounding boxes). Atable is considered to be simple if it does not contain row spans or column spans. Additionally, a table has a strict HTMLstructure if every row has the same number of columns after taking into account any row or column spans. Therefore a strict HTML structure looks always rectangular. However, HTML is a lenient encoding format, i.e. tables with rows of different sizes might still be regarded as correct due to implicit display rules. These implicit rules leave room for ambiguity, which we want to avoid. As such, we prefer to have 'strict' tables, i.e. tables where every row has exactly the same length."}, {"label": "text", "id": 2, "page_no": 10, "cluster": {"id": 2, "label": "text", "bbox": {"l": 50.112, "t": 391.674, "r": 286.365, "b": 627.374, "coord_origin": "TOPLEFT"}, "confidence": 0.9826022386550903, "cells": [{"index": 24, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 400.226, "r_x1": 236.243, "r_y1": 400.226, "r_x2": 236.243, "r_y2": 391.674, "r_x3": 62.067, "r_y3": 391.674, "coord_origin": "TOPLEFT"}, "text": "We have developed a technique that tries", "orig": "We have developed a technique that tries", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 25, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 240.726, "r_y0": 400.226, "r_x1": 248.477, "r_y1": 400.226, "r_x2": 248.477, "r_y2": 391.674, "r_x3": 240.726, "r_y3": 391.674, "coord_origin": "TOPLEFT"}, "text": "to", "orig": "to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 26, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 252.96, "r_y0": 400.226, "r_x1": 277.458, "r_y1": 400.226, "r_x2": 277.458, "r_y2": 391.674, "r_x3": 252.96, "r_y3": 391.674, "coord_origin": "TOPLEFT"}, "text": "derive", "orig": "derive", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 27, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 281.942, "r_y0": 400.226, "r_x1": 286.365, "r_y1": 400.226, "r_x2": 286.365, "r_y2": 391.674, "r_x3": 281.942, "r_y3": 391.674, "coord_origin": "TOPLEFT"}, "text": "a", "orig": "a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 28, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 412.181, "r_x1": 223.571, "r_y1": 412.181, "r_x2": 223.571, "r_y2": 403.629, "r_x3": 50.112, "r_y3": 403.629, "coord_origin": "TOPLEFT"}, "text": "missing bounding box out of its neighbors.", "orig": "missing bounding box out of its neighbors.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 29, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 228.004, "r_y0": 412.181, "r_x1": 286.365, "r_y1": 412.181, "r_x2": 286.365, "r_y2": 403.629, "r_x3": 228.004, "r_y3": 403.629, "coord_origin": "TOPLEFT"}, "text": "As a first step,", "orig": "As a first step,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 30, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 424.136, "r_x1": 286.365, "r_y1": 424.136, "r_x2": 286.365, "r_y2": 415.584, "r_x3": 50.112, "r_y3": 415.584, "coord_origin": "TOPLEFT"}, "text": "we use the annotation data to generate the most fine-grained", "orig": "we use the annotation data to generate the most fine-grained", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 436.092, "r_x1": 189.519, "r_y1": 436.092, "r_x2": 189.519, "r_y2": 427.54, "r_x3": 50.112, "r_y3": 427.54, "coord_origin": "TOPLEFT"}, "text": "grid that covers the table structure.", "orig": "grid that covers the table structure.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 193.414, "r_y0": 436.092, "r_x1": 286.365, "r_y1": 436.092, "r_x2": 286.365, "r_y2": 427.54, "r_x3": 193.414, "r_y3": 427.54, "coord_origin": "TOPLEFT"}, "text": "In case of strict HTML", "orig": "In case of strict HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 448.047, "r_x1": 286.365, "r_y1": 448.047, "r_x2": 286.365, "r_y2": 439.495, "r_x3": 50.112, "r_y3": 439.495, "coord_origin": "TOPLEFT"}, "text": "tables, all grid squares are associated with some table cell", "orig": "tables, all grid squares are associated with some table cell", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 460.002, "r_x1": 286.365, "r_y1": 460.002, "r_x2": 286.365, "r_y2": 451.45, "r_x3": 50.112, "r_y3": 451.45, "coord_origin": "TOPLEFT"}, "text": "and in the presence of table spans a cell extends across mul-", "orig": "and in the presence of table spans a cell extends across mul-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 471.957, "r_x1": 286.365, "r_y1": 471.957, "r_x2": 286.365, "r_y2": 463.405, "r_x3": 50.112, "r_y3": 463.405, "coord_origin": "TOPLEFT"}, "text": "tiple grid squares. When enough bounding boxes are known", "orig": "tiple grid squares. When enough bounding boxes are known", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 483.912, "r_x1": 143.76, "r_y1": 483.912, "r_x2": 143.76, "r_y2": 475.36, "r_x3": 50.112, "r_y3": 475.36, "coord_origin": "TOPLEFT"}, "text": "for a rectangular table,", "orig": "for a rectangular table,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 147.696, "r_y0": 483.912, "r_x1": 153.235, "r_y1": 483.912, "r_x2": 153.235, "r_y2": 475.36, "r_x3": 147.696, "r_y3": 475.36, "coord_origin": "TOPLEFT"}, "text": "it", "orig": "it", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 156.881, "r_y0": 483.912, "r_x1": 163.526, "r_y1": 483.912, "r_x2": 163.526, "r_y2": 475.36, "r_x3": 156.881, "r_y3": 475.36, "coord_origin": "TOPLEFT"}, "text": "is", "orig": "is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 167.173, "r_y0": 483.912, "r_x1": 286.365, "r_y1": 483.912, "r_x2": 286.365, "r_y2": 475.36, "r_x3": 167.173, "r_y3": 475.36, "coord_origin": "TOPLEFT"}, "text": "possible to compute the geo-", "orig": "possible to compute the geo-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 495.867, "r_x1": 286.365, "r_y1": 495.867, "r_x2": 286.365, "r_y2": 487.315, "r_x3": 50.112, "r_y3": 487.315, "coord_origin": "TOPLEFT"}, "text": "metrical border lines between the grid rows and columns.", "orig": "metrical border lines between the grid rows and columns.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 507.823, "r_x1": 286.365, "r_y1": 507.823, "r_x2": 286.365, "r_y2": 499.271, "r_x3": 50.112, "r_y3": 499.271, "coord_origin": "TOPLEFT"}, "text": "Eventually this information is used to generate the missing", "orig": "Eventually this information is used to generate the missing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 519.778, "r_x1": 286.365, "r_y1": 519.778, "r_x2": 286.365, "r_y2": 511.226, "r_x3": 50.112, "r_y3": 511.226, "coord_origin": "TOPLEFT"}, "text": "bounding boxes. Additionally, the existence of unused grid", "orig": "bounding boxes. Additionally, the existence of unused grid", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 531.733, "r_x1": 286.365, "r_y1": 531.733, "r_x2": 286.365, "r_y2": 523.181, "r_x3": 50.112, "r_y3": 523.181, "coord_origin": "TOPLEFT"}, "text": "squares indicates that the table rows have unequal number", "orig": "squares indicates that the table rows have unequal number", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 543.688, "r_x1": 286.365, "r_y1": 543.688, "r_x2": 286.365, "r_y2": 535.136, "r_x3": 50.112, "r_y3": 535.136, "coord_origin": "TOPLEFT"}, "text": "of columns and the overall structure is non-strict. The gen-", "orig": "of columns and the overall structure is non-strict. The gen-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 555.643, "r_x1": 286.365, "r_y1": 555.643, "r_x2": 286.365, "r_y2": 547.091, "r_x3": 50.112, "r_y3": 547.091, "coord_origin": "TOPLEFT"}, "text": "eration of missing bounding boxes for non-strict HTML ta-", "orig": "eration of missing bounding boxes for non-strict HTML ta-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 567.5989999999999, "r_x1": 257.474, "r_y1": 567.5989999999999, "r_x2": 257.474, "r_y2": 559.047, "r_x3": 50.112, "r_y3": 559.047, "coord_origin": "TOPLEFT"}, "text": "bles is ambiguous and therefore quite challenging.", "orig": "bles is ambiguous and therefore quite challenging.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 263.949, "r_y0": 567.5989999999999, "r_x1": 286.365, "r_y1": 567.5989999999999, "r_x2": 286.365, "r_y2": 559.047, "r_x3": 263.949, "r_y3": 559.047, "coord_origin": "TOPLEFT"}, "text": "Thus,", "orig": "Thus,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 48, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 579.554, "r_x1": 242.251, "r_y1": 579.554, "r_x2": 242.251, "r_y2": 571.002, "r_x3": 50.112, "r_y3": 571.002, "coord_origin": "TOPLEFT"}, "text": "we have decided to simply discard those tables.", "orig": "we have decided to simply discard those tables.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 49, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 246.714, "r_y0": 579.554, "r_x1": 286.365, "r_y1": 579.554, "r_x2": 286.365, "r_y2": 571.002, "r_x3": 246.714, "r_y3": 571.002, "coord_origin": "TOPLEFT"}, "text": "In case of", "orig": "In case of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 50, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 591.509, "r_x1": 286.365, "r_y1": 591.509, "r_x2": 286.365, "r_y2": 582.957, "r_x3": 50.112, "r_y3": 582.957, "coord_origin": "TOPLEFT"}, "text": "PubTabNet we have computed missing bounding boxes for", "orig": "PubTabNet we have computed missing bounding boxes for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 51, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 603.4639999999999, "r_x1": 286.365, "r_y1": 603.4639999999999, "r_x2": 286.365, "r_y2": 594.912, "r_x3": 50.112, "r_y3": 594.912, "coord_origin": "TOPLEFT"}, "text": "48% of the simple and 69% of the complex tables. Regard-", "orig": "48% of the simple and 69% of the complex tables. Regard-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 52, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 615.419, "r_x1": 286.365, "r_y1": 615.419, "r_x2": 286.365, "r_y2": 606.867, "r_x3": 50.112, "r_y3": 606.867, "coord_origin": "TOPLEFT"}, "text": "ing FinTabNet, 68% of the simple and 98% of the complex", "orig": "ing FinTabNet, 68% of the simple and 98% of the complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 53, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 627.374, "r_x1": 242.261, "r_y1": 627.374, "r_x2": 242.261, "r_y2": 618.822, "r_x3": 50.112, "r_y3": 618.822, "coord_origin": "TOPLEFT"}, "text": "tables require the generation of bounding boxes.", "orig": "tables require the generation of bounding boxes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "We have developed a technique that tries to derive a missing bounding box out of its neighbors. As a first step, we use the annotation data to generate the most fine-grained grid that covers the table structure. In case of strict HTML tables, all grid squares are associated with some table cell and in the presence of table spans a cell extends across multiple grid squares. When enough bounding boxes are known for a rectangular table, it is possible to compute the geometrical border lines between the grid rows and columns. Eventually this information is used to generate the missing bounding boxes. Additionally, the existence of unused grid squares indicates that the table rows have unequal number of columns and the overall structure is non-strict. The generation of missing bounding boxes for non-strict HTML tables is ambiguous and therefore quite challenging. Thus, we have decided to simply discard those tables. In case of PubTabNet we have computed missing bounding boxes for 48% of the simple and 69% of the complex tables. Regarding FinTabNet, 68% of the simple and 98% of the complex tables require the generation of bounding boxes."}, {"label": "text", "id": 14, "page_no": 10, "cluster": {"id": 14, "label": "text", "bbox": {"l": 50.112, "t": 630.979, "r": 286.365, "b": 651.487, "coord_origin": "TOPLEFT"}, "confidence": 0.9335853457450867, "cells": [{"index": 54, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 639.531, "r_x1": 286.365, "r_y1": 639.531, "r_x2": 286.365, "r_y2": 630.979, "r_x3": 62.067, "r_y3": 630.979, "coord_origin": "TOPLEFT"}, "text": "Figure 7 illustrates the distribution of the tables across", "orig": "Figure 7 illustrates the distribution of the tables across", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 55, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 651.487, "r_x1": 179.905, "r_y1": 651.487, "r_x2": 179.905, "r_y2": 642.935, "r_x3": 50.112, "r_y3": 642.935, "coord_origin": "TOPLEFT"}, "text": "different dimensions per dataset.", "orig": "different dimensions per dataset.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Figure 7 illustrates the distribution of the tables across different dimensions per dataset."}, {"label": "section_header", "id": 12, "page_no": 10, "cluster": {"id": 12, "label": "section_header", "bbox": {"l": 50.112, "t": 662.39, "r": 153.608, "b": 672.242, "coord_origin": "TOPLEFT"}, "confidence": 0.9515743255615234, "cells": [{"index": 56, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 672.242, "r_x1": 153.608, "r_y1": 672.242, "r_x2": 153.608, "r_y2": 662.39, "r_x3": 50.112, "r_y3": 662.39, "coord_origin": "TOPLEFT"}, "text": "1.2. Synthetic datasets", "orig": "1.2. Synthetic datasets", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "1.2. Synthetic datasets"}, {"label": "text", "id": 3, "page_no": 10, "cluster": {"id": 3, "label": "text", "bbox": {"l": 50.112, "t": 681.6, "r": 286.365, "b": 714.062, "coord_origin": "TOPLEFT"}, "confidence": 0.9783332347869873, "cells": [{"index": 57, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 690.152, "r_x1": 286.365, "r_y1": 690.152, "r_x2": 286.365, "r_y2": 681.6, "r_x3": 62.067, "r_y3": 681.6, "coord_origin": "TOPLEFT"}, "text": "Aiming to train and evaluate our models in a broader", "orig": "Aiming to train and evaluate our models in a broader", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 58, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 702.107, "r_x1": 286.365, "r_y1": 702.107, "r_x2": 286.365, "r_y2": 693.5550000000001, "r_x3": 50.112, "r_y3": 693.5550000000001, "coord_origin": "TOPLEFT"}, "text": "spectrum of table data we have synthesized four types of", "orig": "spectrum of table data we have synthesized four types of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 59, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 714.062, "r_x1": 84.144, "r_y1": 714.062, "r_x2": 84.144, "r_y2": 705.51, "r_x3": 50.112, "r_y3": 705.51, "coord_origin": "TOPLEFT"}, "text": "datasets.", "orig": "datasets.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 60, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 91.238, "r_y0": 714.062, "r_x1": 286.365, "r_y1": 714.062, "r_x2": 286.365, "r_y2": 705.51, "r_x3": 91.238, "r_y3": 705.51, "coord_origin": "TOPLEFT"}, "text": "Each one contains tables with different appear-", "orig": "Each one contains tables with different appear-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Aiming to train and evaluate our models in a broader spectrum of table data we have synthesized four types of datasets. Each one contains tables with different appear-"}, {"label": "text", "id": 8, "page_no": 10, "cluster": {"id": 8, "label": "text", "bbox": {"l": 308.862, "t": 162.92399999999998, "r": 545.115, "b": 207.34199999999998, "coord_origin": "TOPLEFT"}, "confidence": 0.9596064686775208, "cells": [{"index": 61, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 171.476, "r_x1": 426.929, "r_y1": 171.476, "r_x2": 426.929, "r_y2": 162.92399999999998, "r_x3": 308.862, "r_y3": 162.92399999999998, "coord_origin": "TOPLEFT"}, "text": "ances in regard to their size,", "orig": "ances in regard to their size,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 62, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 431.043, "r_y0": 171.476, "r_x1": 468.393, "r_y1": 171.476, "r_x2": 468.393, "r_y2": 162.92399999999998, "r_x3": 431.043, "r_y3": 162.92399999999998, "coord_origin": "TOPLEFT"}, "text": "structure,", "orig": "structure,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 63, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 472.508, "r_y0": 171.476, "r_x1": 491.327, "r_y1": 171.476, "r_x2": 491.327, "r_y2": 162.92399999999998, "r_x3": 472.508, "r_y3": 162.92399999999998, "coord_origin": "TOPLEFT"}, "text": "style", "orig": "style", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 64, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 495.113, "r_y0": 171.476, "r_x1": 545.115, "r_y1": 171.476, "r_x2": 545.115, "r_y2": 162.92399999999998, "r_x3": 495.113, "r_y3": 162.92399999999998, "coord_origin": "TOPLEFT"}, "text": "and content.", "orig": "and content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 65, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 183.43100000000004, "r_x1": 545.115, "r_y1": 183.43100000000004, "r_x2": 545.115, "r_y2": 174.87900000000002, "r_x3": 308.862, "r_y3": 174.87900000000002, "coord_origin": "TOPLEFT"}, "text": "Every synthetic dataset contains 150k examples, summing", "orig": "Every synthetic dataset contains 150k examples, summing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 66, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 195.38599999999997, "r_x1": 545.115, "r_y1": 195.38599999999997, "r_x2": 545.115, "r_y2": 186.83399999999995, "r_x3": 308.862, "r_y3": 186.83399999999995, "coord_origin": "TOPLEFT"}, "text": "up to 600k synthetic examples. All datasets are divided into", "orig": "up to 600k synthetic examples. All datasets are divided into", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 67, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 207.34199999999998, "r_x1": 484.074, "r_y1": 207.34199999999998, "r_x2": 484.074, "r_y2": 198.78999999999996, "r_x3": 308.862, "r_y3": 198.78999999999996, "coord_origin": "TOPLEFT"}, "text": "Train, Test and Val splits (80%, 10%, 10%).", "orig": "Train, Test and Val splits (80%, 10%, 10%).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "ances in regard to their size, structure, style and content. Every synthetic dataset contains 150k examples, summing up to 600k synthetic examples. All datasets are divided into Train, Test and Val splits (80%, 10%, 10%)."}, {"label": "text", "id": 15, "page_no": 10, "cluster": {"id": 15, "label": "text", "bbox": {"l": 308.862, "t": 211.50400000000002, "r": 545.115, "b": 232.01099999999997, "coord_origin": "TOPLEFT"}, "confidence": 0.9261796474456787, "cells": [{"index": 68, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 220.05600000000004, "r_x1": 545.115, "r_y1": 220.05600000000004, "r_x2": 545.115, "r_y2": 211.50400000000002, "r_x3": 320.817, "r_y3": 211.50400000000002, "coord_origin": "TOPLEFT"}, "text": "The process of generating a synthetic dataset can be de-", "orig": "The process of generating a synthetic dataset can be de-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 69, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 232.01099999999997, "r_x1": 448.089, "r_y1": 232.01099999999997, "r_x2": 448.089, "r_y2": 223.45899999999995, "r_x3": 308.862, "r_y3": 223.45899999999995, "coord_origin": "TOPLEFT"}, "text": "composed into the following steps:", "orig": "composed into the following steps:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "The process of generating a synthetic dataset can be decomposed into the following steps:"}, {"label": "list_item", "id": 7, "page_no": 10, "cluster": {"id": 7, "label": "list_item", "bbox": {"l": 308.862, "t": 236.17399999999998, "r": 545.115, "b": 316.457, "coord_origin": "TOPLEFT"}, "confidence": 0.9642952680587769, "cells": [{"index": 70, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 244.726, "r_x1": 328.289, "r_y1": 244.726, "r_x2": 328.289, "r_y2": 236.17399999999998, "r_x3": 320.817, "r_y3": 236.17399999999998, "coord_origin": "TOPLEFT"}, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 71, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 335.382, "r_y0": 244.726, "r_x1": 492.911, "r_y1": 244.726, "r_x2": 492.911, "r_y2": 236.17399999999998, "r_x3": 335.382, "r_y3": 236.17399999999998, "coord_origin": "TOPLEFT"}, "text": "Prepare styling and content templates:", "orig": "Prepare styling and content templates:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 72, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 498.669, "r_y0": 244.726, "r_x1": 545.115, "r_y1": 244.726, "r_x2": 545.115, "r_y2": 236.17399999999998, "r_x3": 498.669, "r_y3": 236.17399999999998, "coord_origin": "TOPLEFT"}, "text": "The styling", "orig": "The styling", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 73, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 256.68100000000004, "r_x1": 545.115, "r_y1": 256.68100000000004, "r_x2": 545.115, "r_y2": 248.12900000000002, "r_x3": 308.862, "r_y3": 248.12900000000002, "coord_origin": "TOPLEFT"}, "text": "templates have been manually designed and organized into", "orig": "templates have been manually designed and organized into", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 74, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 268.63599999999997, "r_x1": 481.733, "r_y1": 268.63599999999997, "r_x2": 481.733, "r_y2": 260.08399999999995, "r_x3": 308.862, "r_y3": 260.08399999999995, "coord_origin": "TOPLEFT"}, "text": "groups of scope specific appearances (e.g.", "orig": "groups of scope specific appearances (e.g.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 75, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 488.119, "r_y0": 268.63599999999997, "r_x1": 545.115, "r_y1": 268.63599999999997, "r_x2": 545.115, "r_y2": 260.08399999999995, "r_x3": 488.119, "r_y3": 260.08399999999995, "coord_origin": "TOPLEFT"}, "text": "financial data,", "orig": "financial data,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 76, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 280.591, "r_x1": 393.385, "r_y1": 280.591, "r_x2": 393.385, "r_y2": 272.039, "r_x3": 308.862, "r_y3": 272.039, "coord_origin": "TOPLEFT"}, "text": "marketing data, etc.)", "orig": "marketing data, etc.)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 77, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 400.119, "r_y0": 280.591, "r_x1": 545.115, "r_y1": 280.591, "r_x2": 545.115, "r_y2": 272.039, "r_x3": 400.119, "r_y3": 272.039, "coord_origin": "TOPLEFT"}, "text": "Additionally, we have prepared cu-", "orig": "Additionally, we have prepared cu-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 78, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 292.546, "r_x1": 545.115, "r_y1": 292.546, "r_x2": 545.115, "r_y2": 283.994, "r_x3": 308.862, "r_y3": 283.994, "coord_origin": "TOPLEFT"}, "text": "rated collections of content templates by extracting the most", "orig": "rated collections of content templates by extracting the most", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 79, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 304.502, "r_x1": 349.808, "r_y1": 304.502, "r_x2": 349.808, "r_y2": 295.95, "r_x3": 308.862, "r_y3": 295.95, "coord_origin": "TOPLEFT"}, "text": "frequently", "orig": "frequently", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 80, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 354.152, "r_y0": 304.502, "r_x1": 487.183, "r_y1": 304.502, "r_x2": 487.183, "r_y2": 295.95, "r_x3": 354.152, "r_y3": 295.95, "coord_origin": "TOPLEFT"}, "text": "used terms out of non-synthetic", "orig": "used terms out of non-synthetic", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 81, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 491.526, "r_y0": 304.502, "r_x1": 523.068, "r_y1": 304.502, "r_x2": 523.068, "r_y2": 295.95, "r_x3": 491.526, "r_y3": 295.95, "coord_origin": "TOPLEFT"}, "text": "datasets", "orig": "datasets", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 82, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 527.412, "r_y0": 304.502, "r_x1": 545.115, "r_y1": 304.502, "r_x2": 545.115, "r_y2": 295.95, "r_x3": 527.412, "r_y3": 295.95, "coord_origin": "TOPLEFT"}, "text": "(e.g.", "orig": "(e.g.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 83, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 316.457, "r_x1": 425.693, "r_y1": 316.457, "r_x2": 425.693, "r_y2": 307.905, "r_x3": 308.862, "r_y3": 307.905, "coord_origin": "TOPLEFT"}, "text": "PubTabNet, FinTabNet, etc.).", "orig": "PubTabNet, FinTabNet, etc.).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "1. Prepare styling and content templates: The styling templates have been manually designed and organized into groups of scope specific appearances (e.g. financial data, marketing data, etc.) Additionally, we have prepared curated collections of content templates by extracting the most frequently used terms out of non-synthetic datasets (e.g. PubTabNet, FinTabNet, etc.)."}, {"label": "list_item", "id": 6, "page_no": 10, "cluster": {"id": 6, "label": "list_item", "bbox": {"l": 308.862, "t": 320.619, "r": 545.115, "b": 448.723, "coord_origin": "TOPLEFT"}, "confidence": 0.9699994921684265, "cells": [{"index": 84, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 329.171, "r_x1": 328.289, "r_y1": 329.171, "r_x2": 328.289, "r_y2": 320.619, "r_x3": 320.817, "r_y3": 320.619, "coord_origin": "TOPLEFT"}, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 85, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 332.692, "r_y0": 329.171, "r_x1": 435.377, "r_y1": 329.171, "r_x2": 435.377, "r_y2": 320.619, "r_x3": 332.692, "r_y3": 320.619, "coord_origin": "TOPLEFT"}, "text": "Generate table structures:", "orig": "Generate table structures:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 86, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 439.342, "r_y0": 329.171, "r_x1": 545.115, "r_y1": 329.171, "r_x2": 545.115, "r_y2": 320.619, "r_x3": 439.342, "r_y3": 320.619, "coord_origin": "TOPLEFT"}, "text": "The structure of each syn-", "orig": "The structure of each syn-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 87, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 341.126, "r_x1": 545.115, "r_y1": 341.126, "r_x2": 545.115, "r_y2": 332.574, "r_x3": 308.862, "r_y3": 332.574, "coord_origin": "TOPLEFT"}, "text": "thetic dataset assumes a horizontal table header which po-", "orig": "thetic dataset assumes a horizontal table header which po-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 88, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 353.081, "r_x1": 341.519, "r_y1": 353.081, "r_x2": 341.519, "r_y2": 344.529, "r_x3": 308.862, "r_y3": 344.529, "coord_origin": "TOPLEFT"}, "text": "tentially", "orig": "tentially", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 89, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 345.813, "r_y0": 353.081, "r_x1": 427.168, "r_y1": 353.081, "r_x2": 427.168, "r_y2": 344.529, "r_x3": 345.813, "r_y3": 344.529, "coord_origin": "TOPLEFT"}, "text": "spans over multiple", "orig": "spans over multiple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 90, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 431.462, "r_y0": 353.081, "r_x1": 545.115, "r_y1": 353.081, "r_x2": 545.115, "r_y2": 344.529, "r_x3": 431.462, "r_y3": 344.529, "coord_origin": "TOPLEFT"}, "text": "rows and a table body that", "orig": "rows and a table body that", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 91, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 365.037, "r_x1": 545.115, "r_y1": 365.037, "r_x2": 545.115, "r_y2": 356.485, "r_x3": 308.862, "r_y3": 356.485, "coord_origin": "TOPLEFT"}, "text": "may contain a combination of row spans and column spans.", "orig": "may contain a combination of row spans and column spans.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 92, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 376.992, "r_x1": 545.115, "r_y1": 376.992, "r_x2": 545.115, "r_y2": 368.44, "r_x3": 308.862, "r_y3": 368.44, "coord_origin": "TOPLEFT"}, "text": "However, spans are not allowed to cross the header - body", "orig": "However, spans are not allowed to cross the header - body", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 93, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 388.947, "r_x1": 348.334, "r_y1": 388.947, "r_x2": 348.334, "r_y2": 380.395, "r_x3": 308.862, "r_y3": 380.395, "coord_origin": "TOPLEFT"}, "text": "boundary.", "orig": "boundary.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 94, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 353.504, "r_y0": 388.947, "r_x1": 545.115, "r_y1": 388.947, "r_x2": 545.115, "r_y2": 380.395, "r_x3": 353.504, "r_y3": 380.395, "coord_origin": "TOPLEFT"}, "text": "The table structure is described by the parame-", "orig": "The table structure is described by the parame-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 95, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 400.902, "r_x1": 326.018, "r_y1": 400.902, "r_x2": 326.018, "r_y2": 392.35, "r_x3": 308.862, "r_y3": 392.35, "coord_origin": "TOPLEFT"}, "text": "ters:", "orig": "ters:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 96, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 330.909, "r_y0": 400.902, "r_x1": 545.115, "r_y1": 400.902, "r_x2": 545.115, "r_y2": 392.35, "r_x3": 330.909, "r_y3": 392.35, "coord_origin": "TOPLEFT"}, "text": "Total number of table rows and columns, number of", "orig": "Total number of table rows and columns, number of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 97, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 412.857, "r_x1": 545.115, "r_y1": 412.857, "r_x2": 545.115, "r_y2": 404.305, "r_x3": 308.862, "r_y3": 404.305, "coord_origin": "TOPLEFT"}, "text": "header rows, type of spans (header only spans, row only", "orig": "header rows, type of spans (header only spans, row only", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 98, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 424.812, "r_x1": 333.49, "r_y1": 424.812, "r_x2": 333.49, "r_y2": 416.26, "r_x3": 308.862, "r_y3": 416.26, "coord_origin": "TOPLEFT"}, "text": "spans,", "orig": "spans,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 99, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 338.082, "r_y0": 424.812, "r_x1": 418.66, "r_y1": 424.812, "r_x2": 418.66, "r_y2": 416.26, "r_x3": 338.082, "r_y3": 416.26, "coord_origin": "TOPLEFT"}, "text": "column only spans,", "orig": "column only spans,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 100, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 423.253, "r_y0": 424.812, "r_x1": 545.115, "r_y1": 424.812, "r_x2": 545.115, "r_y2": 416.26, "r_x3": 423.253, "r_y3": 416.26, "coord_origin": "TOPLEFT"}, "text": "both row and column spans),", "orig": "both row and column spans),", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 101, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 436.768, "r_x1": 545.115, "r_y1": 436.768, "r_x2": 545.115, "r_y2": 428.216, "r_x3": 308.862, "r_y3": 428.216, "coord_origin": "TOPLEFT"}, "text": "maximum span size and the ratio of the table area covered", "orig": "maximum span size and the ratio of the table area covered", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 102, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 448.723, "r_x1": 345.943, "r_y1": 448.723, "r_x2": 345.943, "r_y2": 440.171, "r_x3": 308.862, "r_y3": 440.171, "coord_origin": "TOPLEFT"}, "text": "by spans.", "orig": "by spans.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "2. Generate table structures: The structure of each synthetic dataset assumes a horizontal table header which potentially spans over multiple rows and a table body that may contain a combination of row spans and column spans. However, spans are not allowed to cross the header - body boundary. The table structure is described by the parameters: Total number of table rows and columns, number of header rows, type of spans (header only spans, row only spans, column only spans, both row and column spans), maximum span size and the ratio of the table area covered by spans."}, {"label": "list_item", "id": 9, "page_no": 10, "cluster": {"id": 9, "label": "list_item", "bbox": {"l": 308.862, "t": 452.706, "r": 545.115, "b": 497.303, "coord_origin": "TOPLEFT"}, "confidence": 0.9568928480148315, "cells": [{"index": 103, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 461.437, "r_x1": 485.758, "r_y1": 461.437, "r_x2": 485.758, "r_y2": 452.885, "r_x3": 320.817, "r_y3": 452.885, "coord_origin": "TOPLEFT"}, "text": "3. Generate content: Based on the dataset", "orig": "3. Generate content: Based on the dataset", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 104, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 488.073, "r_y0": 461.294, "r_x1": 511.864, "r_y1": 461.294, "r_x2": 511.864, "r_y2": 452.706, "r_x3": 488.073, "r_y3": 452.706, "coord_origin": "TOPLEFT"}, "text": "theme", "orig": "theme", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 105, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 511.863, "r_y0": 461.437, "r_x1": 545.108, "r_y1": 461.437, "r_x2": 545.108, "r_y2": 452.885, "r_x3": 511.863, "r_y3": 452.885, "coord_origin": "TOPLEFT"}, "text": ", a set of", "orig": ", a set of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 106, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 473.392, "r_x1": 545.115, "r_y1": 473.392, "r_x2": 545.115, "r_y2": 464.84, "r_x3": 308.862, "r_y3": 464.84, "coord_origin": "TOPLEFT"}, "text": "suitable content templates is chosen first. Then, this content", "orig": "suitable content templates is chosen first. Then, this content", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 107, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 485.348, "r_x1": 545.115, "r_y1": 485.348, "r_x2": 545.115, "r_y2": 476.796, "r_x3": 308.862, "r_y3": 476.796, "coord_origin": "TOPLEFT"}, "text": "can be combined with purely random text to produce the", "orig": "can be combined with purely random text to produce the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 108, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 497.303, "r_x1": 379.148, "r_y1": 497.303, "r_x2": 379.148, "r_y2": 488.751, "r_x3": 308.862, "r_y3": 488.751, "coord_origin": "TOPLEFT"}, "text": "synthetic content.", "orig": "synthetic content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "3. Generate content: Based on the dataset theme , a set of suitable content templates is chosen first. Then, this content can be combined with purely random text to produce the synthetic content."}, {"label": "list_item", "id": 5, "page_no": 10, "cluster": {"id": 5, "label": "list_item", "bbox": {"l": 308.862, "t": 501.465, "r": 545.115, "b": 545.883, "coord_origin": "TOPLEFT"}, "confidence": 0.9710659980773926, "cells": [{"index": 109, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 510.017, "r_x1": 328.289, "r_y1": 510.017, "r_x2": 328.289, "r_y2": 501.465, "r_x3": 320.817, "r_y3": 501.465, "coord_origin": "TOPLEFT"}, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 110, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 334.217, "r_y0": 510.017, "r_x1": 434.082, "r_y1": 510.017, "r_x2": 434.082, "r_y2": 501.465, "r_x3": 334.217, "r_y3": 501.465, "coord_origin": "TOPLEFT"}, "text": "Apply styling templates:", "orig": "Apply styling templates:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 111, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 439.063, "r_y0": 510.017, "r_x1": 545.115, "r_y1": 510.017, "r_x2": 545.115, "r_y2": 501.465, "r_x3": 439.063, "r_y3": 501.465, "coord_origin": "TOPLEFT"}, "text": "Depending on the domain", "orig": "Depending on the domain", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 112, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 521.972, "r_x1": 406.884, "r_y1": 521.972, "r_x2": 406.884, "r_y2": 513.4200000000001, "r_x3": 308.862, "r_y3": 513.4200000000001, "coord_origin": "TOPLEFT"}, "text": "of the synthetic dataset,", "orig": "of the synthetic dataset,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 113, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 411.019, "r_y0": 521.972, "r_x1": 545.115, "r_y1": 521.972, "r_x2": 545.115, "r_y2": 513.4200000000001, "r_x3": 411.019, "r_y3": 513.4200000000001, "coord_origin": "TOPLEFT"}, "text": "a set of styling templates is first", "orig": "a set of styling templates is first", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 114, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 533.928, "r_x1": 384.299, "r_y1": 533.928, "r_x2": 384.299, "r_y2": 525.376, "r_x3": 308.862, "r_y3": 525.376, "coord_origin": "TOPLEFT"}, "text": "manually selected.", "orig": "manually selected.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 115, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 391.253, "r_y0": 533.928, "r_x1": 545.115, "r_y1": 533.928, "r_x2": 545.115, "r_y2": 525.376, "r_x3": 391.253, "r_y3": 525.376, "coord_origin": "TOPLEFT"}, "text": "Then, a style is randomly selected to", "orig": "Then, a style is randomly selected to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 116, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 545.883, "r_x1": 496.159, "r_y1": 545.883, "r_x2": 496.159, "r_y2": 537.331, "r_x3": 308.862, "r_y3": 537.331, "coord_origin": "TOPLEFT"}, "text": "format the appearance of the synthesized table.", "orig": "format the appearance of the synthesized table.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "4. Apply styling templates: Depending on the domain of the synthetic dataset, a set of styling templates is first manually selected. Then, a style is randomly selected to format the appearance of the synthesized table."}, {"label": "list_item", "id": 4, "page_no": 10, "cluster": {"id": 4, "label": "list_item", "bbox": {"l": 308.862, "t": 550.045, "r": 545.115, "b": 606.418, "coord_origin": "TOPLEFT"}, "confidence": 0.9778757095336914, "cells": [{"index": 117, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 558.597, "r_x1": 328.289, "r_y1": 558.597, "r_x2": 328.289, "r_y2": 550.045, "r_x3": 320.817, "r_y3": 550.045, "coord_origin": "TOPLEFT"}, "text": "5.", "orig": "5.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 118, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 335.402, "r_y0": 558.597, "r_x1": 450.371, "r_y1": 558.597, "r_x2": 450.371, "r_y2": 550.045, "r_x3": 335.402, "r_y3": 550.045, "coord_origin": "TOPLEFT"}, "text": "Render the complete tables:", "orig": "Render the complete tables:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 119, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 456.139, "r_y0": 558.597, "r_x1": 545.115, "r_y1": 558.597, "r_x2": 545.115, "r_y2": 550.045, "r_x3": 456.139, "r_y3": 550.045, "coord_origin": "TOPLEFT"}, "text": "The synthetic table is", "orig": "The synthetic table is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 120, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 570.552, "r_x1": 334.326, "r_y1": 570.552, "r_x2": 334.326, "r_y2": 562.0, "r_x3": 308.862, "r_y3": 562.0, "coord_origin": "TOPLEFT"}, "text": "finally", "orig": "finally", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 121, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 337.983, "r_y0": 570.552, "r_x1": 545.115, "r_y1": 570.552, "r_x2": 545.115, "r_y2": 562.0, "r_x3": 337.983, "r_y3": 562.0, "coord_origin": "TOPLEFT"}, "text": "rendered by a web browser engine to generate the", "orig": "rendered by a web browser engine to generate the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 122, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 582.5070000000001, "r_x1": 545.115, "r_y1": 582.5070000000001, "r_x2": 545.115, "r_y2": 573.955, "r_x3": 308.862, "r_y3": 573.955, "coord_origin": "TOPLEFT"}, "text": "bounding boxes for each table cell. A batching technique is", "orig": "bounding boxes for each table cell. A batching technique is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 123, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 594.463, "r_x1": 545.115, "r_y1": 594.463, "r_x2": 545.115, "r_y2": 585.9110000000001, "r_x3": 308.862, "r_y3": 585.9110000000001, "coord_origin": "TOPLEFT"}, "text": "utilized to optimize the runtime overhead of the rendering", "orig": "utilized to optimize the runtime overhead of the rendering", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 124, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 606.418, "r_x1": 341.23, "r_y1": 606.418, "r_x2": 341.23, "r_y2": 597.866, "r_x3": 308.862, "r_y3": 597.866, "coord_origin": "TOPLEFT"}, "text": "process.", "orig": "process.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "5. Render the complete tables: The synthetic table is finally rendered by a web browser engine to generate the bounding boxes for each table cell. A batching technique is utilized to optimize the runtime overhead of the rendering process."}, {"label": "section_header", "id": 10, "page_no": 10, "cluster": {"id": 10, "label": "section_header", "bbox": {"l": 308.862, "t": 622.2909999999999, "r": 545.109, "b": 646.987, "coord_origin": "TOPLEFT"}, "confidence": 0.954940915107727, "cells": [{"index": 125, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 633.039, "r_x1": 317.828, "r_y1": 633.039, "r_x2": 317.828, "r_y2": 622.2909999999999, "r_x3": 308.862, "r_y3": 622.2909999999999, "coord_origin": "TOPLEFT"}, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 126, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 323.591, "r_y0": 633.039, "r_x1": 376.493, "r_y1": 633.039, "r_x2": 376.493, "r_y2": 622.2909999999999, "r_x3": 323.591, "r_y3": 622.2909999999999, "coord_origin": "TOPLEFT"}, "text": "Prediction", "orig": "Prediction", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 127, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 382.255, "r_y0": 633.039, "r_x1": 461.076, "r_y1": 633.039, "r_x2": 461.076, "r_y2": 622.2909999999999, "r_x3": 382.255, "r_y3": 622.2909999999999, "coord_origin": "TOPLEFT"}, "text": "post-processing", "orig": "post-processing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 128, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 466.826, "r_y0": 633.039, "r_x1": 481.794, "r_y1": 633.039, "r_x2": 481.794, "r_y2": 622.2909999999999, "r_x3": 466.826, "r_y3": 622.2909999999999, "coord_origin": "TOPLEFT"}, "text": "for", "orig": "for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 129, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 487.556, "r_y0": 633.039, "r_x1": 545.109, "r_y1": 633.039, "r_x2": 545.109, "r_y2": 622.2909999999999, "r_x3": 487.556, "r_y3": 622.2909999999999, "coord_origin": "TOPLEFT"}, "text": "PDF docu-", "orig": "PDF docu-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 130, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 326.795, "r_y0": 646.987, "r_x1": 357.341, "r_y1": 646.987, "r_x2": 357.341, "r_y2": 636.239, "r_x3": 326.795, "r_y3": 636.239, "coord_origin": "TOPLEFT"}, "text": "ments", "orig": "ments", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "2. Prediction post-processing for PDF documents"}, {"label": "text", "id": 1, "page_no": 10, "cluster": {"id": 1, "label": "text", "bbox": {"l": 308.862, "t": 657.69, "r": 545.115, "b": 714.063, "coord_origin": "TOPLEFT"}, "confidence": 0.9829329252243042, "cells": [{"index": 131, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 666.242, "r_x1": 545.115, "r_y1": 666.242, "r_x2": 545.115, "r_y2": 657.69, "r_x3": 320.817, "r_y3": 657.69, "coord_origin": "TOPLEFT"}, "text": "Although TableFormer can predict the table structure and", "orig": "Although TableFormer can predict the table structure and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 132, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 678.197, "r_x1": 545.115, "r_y1": 678.197, "r_x2": 545.115, "r_y2": 669.645, "r_x3": 308.862, "r_y3": 669.645, "coord_origin": "TOPLEFT"}, "text": "the bounding boxes for tables recognized inside PDF docu-", "orig": "the bounding boxes for tables recognized inside PDF docu-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 133, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 690.152, "r_x1": 545.115, "r_y1": 690.152, "r_x2": 545.115, "r_y2": 681.6, "r_x3": 308.862, "r_y3": 681.6, "coord_origin": "TOPLEFT"}, "text": "ments, this is not enough when a full reconstruction of the", "orig": "ments, this is not enough when a full reconstruction of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 134, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 702.107, "r_x1": 545.115, "r_y1": 702.107, "r_x2": 545.115, "r_y2": 693.5550000000001, "r_x3": 308.862, "r_y3": 693.5550000000001, "coord_origin": "TOPLEFT"}, "text": "original table is required. This happens mainly due the fol-", "orig": "original table is required. This happens mainly due the fol-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 135, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 714.063, "r_x1": 371.427, "r_y1": 714.063, "r_x2": 371.427, "r_y2": 705.511, "r_x3": 308.862, "r_y3": 705.511, "coord_origin": "TOPLEFT"}, "text": "lowing reasons:", "orig": "lowing reasons:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Although TableFormer can predict the table structure and the bounding boxes for tables recognized inside PDF documents, this is not enough when a full reconstruction of the original table is required. This happens mainly due the following reasons:"}, {"label": "page_footer", "id": 16, "page_no": 10, "cluster": {"id": 16, "label": "page_footer", "bbox": {"l": 292.631, "t": 734.402, "r": 302.594, "b": 742.954, "coord_origin": "TOPLEFT"}, "confidence": 0.8986663222312927, "cells": [{"index": 136, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 292.631, "r_y0": 742.954, "r_x1": 302.594, "r_y1": 742.954, "r_x2": 302.594, "r_y2": 734.402, "r_x3": 292.631, "r_y3": 734.402, "coord_origin": "TOPLEFT"}, "text": "11", "orig": "11", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "11"}], "body": [{"label": "section_header", "id": 18, "page_no": 10, "cluster": {"id": 18, "label": "section_header", "bbox": {"l": 132.842, "t": 110.57500000000005, "r": 465.376, "b": 135.48400000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.6497084498405457, "cells": [{"index": 0, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 132.842, "r_y0": 121.32299999999998, "r_x1": 465.376, "r_y1": 121.32299999999998, "r_x2": 465.376, "r_y2": 110.57500000000005, "r_x3": 132.842, "r_y3": 110.57500000000005, "coord_origin": "TOPLEFT"}, "text": "TableFormer: Table Structure Understanding with Transformers", "orig": "TableFormer: Table Structure Understanding with Transformers", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 220.184, "r_y0": 135.48400000000004, "r_x1": 375.043, "r_y1": 135.48400000000004, "r_x2": 375.043, "r_y2": 122.42399999999998, "r_x3": 220.184, "r_y3": 122.42399999999998, "coord_origin": "TOPLEFT"}, "text": "Supplementary Material", "orig": "Supplementary Material", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "TableFormer: Table Structure Understanding with Transformers Supplementary Material"}, {"label": "section_header", "id": 13, "page_no": 10, "cluster": {"id": 13, "label": "section_header", "bbox": {"l": 50.112, "t": 161.16099999999994, "r": 175.964, "b": 171.909, "coord_origin": "TOPLEFT"}, "confidence": 0.9454860091209412, "cells": [{"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 171.909, "r_x1": 175.964, "r_y1": 171.909, "r_x2": 175.964, "r_y2": 161.16099999999994, "r_x3": 50.112, "r_y3": 161.16099999999994, "coord_origin": "TOPLEFT"}, "text": "1. Details on the datasets", "orig": "1. Details on the datasets", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "1. Details on the datasets"}, {"label": "section_header", "id": 11, "page_no": 10, "cluster": {"id": 11, "label": "section_header", "bbox": {"l": 50.112, "t": 180.97900000000004, "r": 150.364, "b": 190.83100000000002, "coord_origin": "TOPLEFT"}, "confidence": 0.9535645842552185, "cells": [{"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 190.83100000000002, "r_x1": 150.364, "r_y1": 190.83100000000002, "r_x2": 150.364, "r_y2": 180.97900000000004, "r_x3": 50.112, "r_y3": 180.97900000000004, "coord_origin": "TOPLEFT"}, "text": "1.1. Data preparation", "orig": "1.1. Data preparation", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "1.1. Data preparation"}, {"label": "text", "id": 0, "page_no": 10, "cluster": {"id": 0, "label": "text", "bbox": {"l": 50.112, "t": 200.18899999999996, "r": 286.365, "b": 388.069, "coord_origin": "TOPLEFT"}, "confidence": 0.9864971041679382, "cells": [{"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 208.74099999999999, "r_x1": 286.365, "r_y1": 208.74099999999999, "r_x2": 286.365, "r_y2": 200.18899999999996, "r_x3": 62.067, "r_y3": 200.18899999999996, "coord_origin": "TOPLEFT"}, "text": "As a first step of our data preparation process, we have", "orig": "As a first step of our data preparation process, we have", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 220.697, "r_x1": 286.365, "r_y1": 220.697, "r_x2": 286.365, "r_y2": 212.14499999999998, "r_x3": 50.112, "r_y3": 212.14499999999998, "coord_origin": "TOPLEFT"}, "text": "calculated statistics over the datasets across the following", "orig": "calculated statistics over the datasets across the following", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 232.65200000000004, "r_x1": 286.365, "r_y1": 232.65200000000004, "r_x2": 286.365, "r_y2": 224.10000000000002, "r_x3": 50.112, "r_y3": 224.10000000000002, "coord_origin": "TOPLEFT"}, "text": "dimensions: (1) table size measured in the number of rows", "orig": "dimensions: (1) table size measured in the number of rows", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 244.60699999999997, "r_x1": 286.365, "r_y1": 244.60699999999997, "r_x2": 286.365, "r_y2": 236.05499999999995, "r_x3": 50.112, "r_y3": 236.05499999999995, "coord_origin": "TOPLEFT"}, "text": "and columns, (2) complexity of the table, (3) strictness of", "orig": "and columns, (2) complexity of the table, (3) strictness of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 256.562, "r_x1": 286.365, "r_y1": 256.562, "r_x2": 286.365, "r_y2": 248.01, "r_x3": 50.112, "r_y3": 248.01, "coord_origin": "TOPLEFT"}, "text": "the provided HTML structure and (4) completeness (i.e. no", "orig": "the provided HTML structure and (4) completeness (i.e. no", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 268.51700000000005, "r_x1": 286.365, "r_y1": 268.51700000000005, "r_x2": 286.365, "r_y2": 259.96500000000003, "r_x3": 50.112, "r_y3": 259.96500000000003, "coord_origin": "TOPLEFT"}, "text": "omitted bounding boxes). Atable is considered to be simple", "orig": "omitted bounding boxes). Atable is considered to be simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 280.472, "r_x1": 286.365, "r_y1": 280.472, "r_x2": 286.365, "r_y2": 271.91999999999996, "r_x3": 50.112, "r_y3": 271.91999999999996, "coord_origin": "TOPLEFT"}, "text": "if it does not contain row spans or column spans. Addition-", "orig": "if it does not contain row spans or column spans. Addition-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 292.428, "r_x1": 286.365, "r_y1": 292.428, "r_x2": 286.365, "r_y2": 283.876, "r_x3": 50.112, "r_y3": 283.876, "coord_origin": "TOPLEFT"}, "text": "ally, a table has a strict HTMLstructure if every row has the", "orig": "ally, a table has a strict HTMLstructure if every row has the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 304.383, "r_x1": 286.365, "r_y1": 304.383, "r_x2": 286.365, "r_y2": 295.831, "r_x3": 50.112, "r_y3": 295.831, "coord_origin": "TOPLEFT"}, "text": "same number of columns after taking into account any row", "orig": "same number of columns after taking into account any row", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 316.338, "r_x1": 118.834, "r_y1": 316.338, "r_x2": 118.834, "r_y2": 307.786, "r_x3": 50.112, "r_y3": 307.786, "coord_origin": "TOPLEFT"}, "text": "or column spans.", "orig": "or column spans.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 123.307, "r_y0": 316.338, "r_x1": 286.365, "r_y1": 316.338, "r_x2": 286.365, "r_y2": 307.786, "r_x3": 123.307, "r_y3": 307.786, "coord_origin": "TOPLEFT"}, "text": "Therefore a strict HTML structure looks", "orig": "Therefore a strict HTML structure looks", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 328.293, "r_x1": 127.163, "r_y1": 328.293, "r_x2": 127.163, "r_y2": 319.741, "r_x3": 50.112, "r_y3": 319.741, "coord_origin": "TOPLEFT"}, "text": "always rectangular.", "orig": "always rectangular.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 131.257, "r_y0": 328.293, "r_x1": 286.365, "r_y1": 328.293, "r_x2": 286.365, "r_y2": 319.741, "r_x3": 131.257, "r_y3": 319.741, "coord_origin": "TOPLEFT"}, "text": "However, HTML is a lenient encoding", "orig": "However, HTML is a lenient encoding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 340.248, "r_x1": 95.163, "r_y1": 340.248, "r_x2": 95.163, "r_y2": 331.696, "r_x3": 50.112, "r_y3": 331.696, "coord_origin": "TOPLEFT"}, "text": "format, i.e.", "orig": "format, i.e.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 101.459, "r_y0": 340.248, "r_x1": 286.365, "r_y1": 340.248, "r_x2": 286.365, "r_y2": 331.696, "r_x3": 101.459, "r_y3": 331.696, "coord_origin": "TOPLEFT"}, "text": "tables with rows of different sizes might still", "orig": "tables with rows of different sizes might still", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 19, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 352.204, "r_x1": 257.942, "r_y1": 352.204, "r_x2": 257.942, "r_y2": 343.652, "r_x3": 50.112, "r_y3": 343.652, "coord_origin": "TOPLEFT"}, "text": "be regarded as correct due to implicit display rules.", "orig": "be regarded as correct due to implicit display rules.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 20, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 262.574, "r_y0": 352.204, "r_x1": 286.365, "r_y1": 352.204, "r_x2": 286.365, "r_y2": 343.652, "r_x3": 262.574, "r_y3": 343.652, "coord_origin": "TOPLEFT"}, "text": "These", "orig": "These", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 21, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 364.159, "r_x1": 286.365, "r_y1": 364.159, "r_x2": 286.365, "r_y2": 355.607, "r_x3": 50.112, "r_y3": 355.607, "coord_origin": "TOPLEFT"}, "text": "implicit rules leave room for ambiguity, which we want to", "orig": "implicit rules leave room for ambiguity, which we want to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 22, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 376.114, "r_x1": 286.365, "r_y1": 376.114, "r_x2": 286.365, "r_y2": 367.562, "r_x3": 50.112, "r_y3": 367.562, "coord_origin": "TOPLEFT"}, "text": "avoid. As such, we prefer to have 'strict' tables, i.e. tables", "orig": "avoid. As such, we prefer to have 'strict' tables, i.e. tables", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 23, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 388.069, "r_x1": 230.804, "r_y1": 388.069, "r_x2": 230.804, "r_y2": 379.517, "r_x3": 50.112, "r_y3": 379.517, "coord_origin": "TOPLEFT"}, "text": "where every row has exactly the same length.", "orig": "where every row has exactly the same length.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "As a first step of our data preparation process, we have calculated statistics over the datasets across the following dimensions: (1) table size measured in the number of rows and columns, (2) complexity of the table, (3) strictness of the provided HTML structure and (4) completeness (i.e. no omitted bounding boxes). Atable is considered to be simple if it does not contain row spans or column spans. Additionally, a table has a strict HTMLstructure if every row has the same number of columns after taking into account any row or column spans. Therefore a strict HTML structure looks always rectangular. However, HTML is a lenient encoding format, i.e. tables with rows of different sizes might still be regarded as correct due to implicit display rules. These implicit rules leave room for ambiguity, which we want to avoid. As such, we prefer to have 'strict' tables, i.e. tables where every row has exactly the same length."}, {"label": "text", "id": 2, "page_no": 10, "cluster": {"id": 2, "label": "text", "bbox": {"l": 50.112, "t": 391.674, "r": 286.365, "b": 627.374, "coord_origin": "TOPLEFT"}, "confidence": 0.9826022386550903, "cells": [{"index": 24, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 400.226, "r_x1": 236.243, "r_y1": 400.226, "r_x2": 236.243, "r_y2": 391.674, "r_x3": 62.067, "r_y3": 391.674, "coord_origin": "TOPLEFT"}, "text": "We have developed a technique that tries", "orig": "We have developed a technique that tries", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 25, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 240.726, "r_y0": 400.226, "r_x1": 248.477, "r_y1": 400.226, "r_x2": 248.477, "r_y2": 391.674, "r_x3": 240.726, "r_y3": 391.674, "coord_origin": "TOPLEFT"}, "text": "to", "orig": "to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 26, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 252.96, "r_y0": 400.226, "r_x1": 277.458, "r_y1": 400.226, "r_x2": 277.458, "r_y2": 391.674, "r_x3": 252.96, "r_y3": 391.674, "coord_origin": "TOPLEFT"}, "text": "derive", "orig": "derive", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 27, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 281.942, "r_y0": 400.226, "r_x1": 286.365, "r_y1": 400.226, "r_x2": 286.365, "r_y2": 391.674, "r_x3": 281.942, "r_y3": 391.674, "coord_origin": "TOPLEFT"}, "text": "a", "orig": "a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 28, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 412.181, "r_x1": 223.571, "r_y1": 412.181, "r_x2": 223.571, "r_y2": 403.629, "r_x3": 50.112, "r_y3": 403.629, "coord_origin": "TOPLEFT"}, "text": "missing bounding box out of its neighbors.", "orig": "missing bounding box out of its neighbors.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 29, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 228.004, "r_y0": 412.181, "r_x1": 286.365, "r_y1": 412.181, "r_x2": 286.365, "r_y2": 403.629, "r_x3": 228.004, "r_y3": 403.629, "coord_origin": "TOPLEFT"}, "text": "As a first step,", "orig": "As a first step,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 30, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 424.136, "r_x1": 286.365, "r_y1": 424.136, "r_x2": 286.365, "r_y2": 415.584, "r_x3": 50.112, "r_y3": 415.584, "coord_origin": "TOPLEFT"}, "text": "we use the annotation data to generate the most fine-grained", "orig": "we use the annotation data to generate the most fine-grained", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 436.092, "r_x1": 189.519, "r_y1": 436.092, "r_x2": 189.519, "r_y2": 427.54, "r_x3": 50.112, "r_y3": 427.54, "coord_origin": "TOPLEFT"}, "text": "grid that covers the table structure.", "orig": "grid that covers the table structure.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 193.414, "r_y0": 436.092, "r_x1": 286.365, "r_y1": 436.092, "r_x2": 286.365, "r_y2": 427.54, "r_x3": 193.414, "r_y3": 427.54, "coord_origin": "TOPLEFT"}, "text": "In case of strict HTML", "orig": "In case of strict HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 448.047, "r_x1": 286.365, "r_y1": 448.047, "r_x2": 286.365, "r_y2": 439.495, "r_x3": 50.112, "r_y3": 439.495, "coord_origin": "TOPLEFT"}, "text": "tables, all grid squares are associated with some table cell", "orig": "tables, all grid squares are associated with some table cell", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 460.002, "r_x1": 286.365, "r_y1": 460.002, "r_x2": 286.365, "r_y2": 451.45, "r_x3": 50.112, "r_y3": 451.45, "coord_origin": "TOPLEFT"}, "text": "and in the presence of table spans a cell extends across mul-", "orig": "and in the presence of table spans a cell extends across mul-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 471.957, "r_x1": 286.365, "r_y1": 471.957, "r_x2": 286.365, "r_y2": 463.405, "r_x3": 50.112, "r_y3": 463.405, "coord_origin": "TOPLEFT"}, "text": "tiple grid squares. When enough bounding boxes are known", "orig": "tiple grid squares. When enough bounding boxes are known", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 483.912, "r_x1": 143.76, "r_y1": 483.912, "r_x2": 143.76, "r_y2": 475.36, "r_x3": 50.112, "r_y3": 475.36, "coord_origin": "TOPLEFT"}, "text": "for a rectangular table,", "orig": "for a rectangular table,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 147.696, "r_y0": 483.912, "r_x1": 153.235, "r_y1": 483.912, "r_x2": 153.235, "r_y2": 475.36, "r_x3": 147.696, "r_y3": 475.36, "coord_origin": "TOPLEFT"}, "text": "it", "orig": "it", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 156.881, "r_y0": 483.912, "r_x1": 163.526, "r_y1": 483.912, "r_x2": 163.526, "r_y2": 475.36, "r_x3": 156.881, "r_y3": 475.36, "coord_origin": "TOPLEFT"}, "text": "is", "orig": "is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 167.173, "r_y0": 483.912, "r_x1": 286.365, "r_y1": 483.912, "r_x2": 286.365, "r_y2": 475.36, "r_x3": 167.173, "r_y3": 475.36, "coord_origin": "TOPLEFT"}, "text": "possible to compute the geo-", "orig": "possible to compute the geo-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 495.867, "r_x1": 286.365, "r_y1": 495.867, "r_x2": 286.365, "r_y2": 487.315, "r_x3": 50.112, "r_y3": 487.315, "coord_origin": "TOPLEFT"}, "text": "metrical border lines between the grid rows and columns.", "orig": "metrical border lines between the grid rows and columns.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 507.823, "r_x1": 286.365, "r_y1": 507.823, "r_x2": 286.365, "r_y2": 499.271, "r_x3": 50.112, "r_y3": 499.271, "coord_origin": "TOPLEFT"}, "text": "Eventually this information is used to generate the missing", "orig": "Eventually this information is used to generate the missing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 519.778, "r_x1": 286.365, "r_y1": 519.778, "r_x2": 286.365, "r_y2": 511.226, "r_x3": 50.112, "r_y3": 511.226, "coord_origin": "TOPLEFT"}, "text": "bounding boxes. Additionally, the existence of unused grid", "orig": "bounding boxes. Additionally, the existence of unused grid", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 531.733, "r_x1": 286.365, "r_y1": 531.733, "r_x2": 286.365, "r_y2": 523.181, "r_x3": 50.112, "r_y3": 523.181, "coord_origin": "TOPLEFT"}, "text": "squares indicates that the table rows have unequal number", "orig": "squares indicates that the table rows have unequal number", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 543.688, "r_x1": 286.365, "r_y1": 543.688, "r_x2": 286.365, "r_y2": 535.136, "r_x3": 50.112, "r_y3": 535.136, "coord_origin": "TOPLEFT"}, "text": "of columns and the overall structure is non-strict. The gen-", "orig": "of columns and the overall structure is non-strict. The gen-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 555.643, "r_x1": 286.365, "r_y1": 555.643, "r_x2": 286.365, "r_y2": 547.091, "r_x3": 50.112, "r_y3": 547.091, "coord_origin": "TOPLEFT"}, "text": "eration of missing bounding boxes for non-strict HTML ta-", "orig": "eration of missing bounding boxes for non-strict HTML ta-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 567.5989999999999, "r_x1": 257.474, "r_y1": 567.5989999999999, "r_x2": 257.474, "r_y2": 559.047, "r_x3": 50.112, "r_y3": 559.047, "coord_origin": "TOPLEFT"}, "text": "bles is ambiguous and therefore quite challenging.", "orig": "bles is ambiguous and therefore quite challenging.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 263.949, "r_y0": 567.5989999999999, "r_x1": 286.365, "r_y1": 567.5989999999999, "r_x2": 286.365, "r_y2": 559.047, "r_x3": 263.949, "r_y3": 559.047, "coord_origin": "TOPLEFT"}, "text": "Thus,", "orig": "Thus,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 48, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 579.554, "r_x1": 242.251, "r_y1": 579.554, "r_x2": 242.251, "r_y2": 571.002, "r_x3": 50.112, "r_y3": 571.002, "coord_origin": "TOPLEFT"}, "text": "we have decided to simply discard those tables.", "orig": "we have decided to simply discard those tables.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 49, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 246.714, "r_y0": 579.554, "r_x1": 286.365, "r_y1": 579.554, "r_x2": 286.365, "r_y2": 571.002, "r_x3": 246.714, "r_y3": 571.002, "coord_origin": "TOPLEFT"}, "text": "In case of", "orig": "In case of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 50, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 591.509, "r_x1": 286.365, "r_y1": 591.509, "r_x2": 286.365, "r_y2": 582.957, "r_x3": 50.112, "r_y3": 582.957, "coord_origin": "TOPLEFT"}, "text": "PubTabNet we have computed missing bounding boxes for", "orig": "PubTabNet we have computed missing bounding boxes for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 51, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 603.4639999999999, "r_x1": 286.365, "r_y1": 603.4639999999999, "r_x2": 286.365, "r_y2": 594.912, "r_x3": 50.112, "r_y3": 594.912, "coord_origin": "TOPLEFT"}, "text": "48% of the simple and 69% of the complex tables. Regard-", "orig": "48% of the simple and 69% of the complex tables. Regard-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 52, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 615.419, "r_x1": 286.365, "r_y1": 615.419, "r_x2": 286.365, "r_y2": 606.867, "r_x3": 50.112, "r_y3": 606.867, "coord_origin": "TOPLEFT"}, "text": "ing FinTabNet, 68% of the simple and 98% of the complex", "orig": "ing FinTabNet, 68% of the simple and 98% of the complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 53, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 627.374, "r_x1": 242.261, "r_y1": 627.374, "r_x2": 242.261, "r_y2": 618.822, "r_x3": 50.112, "r_y3": 618.822, "coord_origin": "TOPLEFT"}, "text": "tables require the generation of bounding boxes.", "orig": "tables require the generation of bounding boxes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "We have developed a technique that tries to derive a missing bounding box out of its neighbors. As a first step, we use the annotation data to generate the most fine-grained grid that covers the table structure. In case of strict HTML tables, all grid squares are associated with some table cell and in the presence of table spans a cell extends across multiple grid squares. When enough bounding boxes are known for a rectangular table, it is possible to compute the geometrical border lines between the grid rows and columns. Eventually this information is used to generate the missing bounding boxes. Additionally, the existence of unused grid squares indicates that the table rows have unequal number of columns and the overall structure is non-strict. The generation of missing bounding boxes for non-strict HTML tables is ambiguous and therefore quite challenging. Thus, we have decided to simply discard those tables. In case of PubTabNet we have computed missing bounding boxes for 48% of the simple and 69% of the complex tables. Regarding FinTabNet, 68% of the simple and 98% of the complex tables require the generation of bounding boxes."}, {"label": "text", "id": 14, "page_no": 10, "cluster": {"id": 14, "label": "text", "bbox": {"l": 50.112, "t": 630.979, "r": 286.365, "b": 651.487, "coord_origin": "TOPLEFT"}, "confidence": 0.9335853457450867, "cells": [{"index": 54, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 639.531, "r_x1": 286.365, "r_y1": 639.531, "r_x2": 286.365, "r_y2": 630.979, "r_x3": 62.067, "r_y3": 630.979, "coord_origin": "TOPLEFT"}, "text": "Figure 7 illustrates the distribution of the tables across", "orig": "Figure 7 illustrates the distribution of the tables across", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 55, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 651.487, "r_x1": 179.905, "r_y1": 651.487, "r_x2": 179.905, "r_y2": 642.935, "r_x3": 50.112, "r_y3": 642.935, "coord_origin": "TOPLEFT"}, "text": "different dimensions per dataset.", "orig": "different dimensions per dataset.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Figure 7 illustrates the distribution of the tables across different dimensions per dataset."}, {"label": "section_header", "id": 12, "page_no": 10, "cluster": {"id": 12, "label": "section_header", "bbox": {"l": 50.112, "t": 662.39, "r": 153.608, "b": 672.242, "coord_origin": "TOPLEFT"}, "confidence": 0.9515743255615234, "cells": [{"index": 56, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 672.242, "r_x1": 153.608, "r_y1": 672.242, "r_x2": 153.608, "r_y2": 662.39, "r_x3": 50.112, "r_y3": 662.39, "coord_origin": "TOPLEFT"}, "text": "1.2. Synthetic datasets", "orig": "1.2. Synthetic datasets", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "1.2. Synthetic datasets"}, {"label": "text", "id": 3, "page_no": 10, "cluster": {"id": 3, "label": "text", "bbox": {"l": 50.112, "t": 681.6, "r": 286.365, "b": 714.062, "coord_origin": "TOPLEFT"}, "confidence": 0.9783332347869873, "cells": [{"index": 57, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 690.152, "r_x1": 286.365, "r_y1": 690.152, "r_x2": 286.365, "r_y2": 681.6, "r_x3": 62.067, "r_y3": 681.6, "coord_origin": "TOPLEFT"}, "text": "Aiming to train and evaluate our models in a broader", "orig": "Aiming to train and evaluate our models in a broader", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 58, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 702.107, "r_x1": 286.365, "r_y1": 702.107, "r_x2": 286.365, "r_y2": 693.5550000000001, "r_x3": 50.112, "r_y3": 693.5550000000001, "coord_origin": "TOPLEFT"}, "text": "spectrum of table data we have synthesized four types of", "orig": "spectrum of table data we have synthesized four types of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 59, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 714.062, "r_x1": 84.144, "r_y1": 714.062, "r_x2": 84.144, "r_y2": 705.51, "r_x3": 50.112, "r_y3": 705.51, "coord_origin": "TOPLEFT"}, "text": "datasets.", "orig": "datasets.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 60, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 91.238, "r_y0": 714.062, "r_x1": 286.365, "r_y1": 714.062, "r_x2": 286.365, "r_y2": 705.51, "r_x3": 91.238, "r_y3": 705.51, "coord_origin": "TOPLEFT"}, "text": "Each one contains tables with different appear-", "orig": "Each one contains tables with different appear-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Aiming to train and evaluate our models in a broader spectrum of table data we have synthesized four types of datasets. Each one contains tables with different appear-"}, {"label": "text", "id": 8, "page_no": 10, "cluster": {"id": 8, "label": "text", "bbox": {"l": 308.862, "t": 162.92399999999998, "r": 545.115, "b": 207.34199999999998, "coord_origin": "TOPLEFT"}, "confidence": 0.9596064686775208, "cells": [{"index": 61, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 171.476, "r_x1": 426.929, "r_y1": 171.476, "r_x2": 426.929, "r_y2": 162.92399999999998, "r_x3": 308.862, "r_y3": 162.92399999999998, "coord_origin": "TOPLEFT"}, "text": "ances in regard to their size,", "orig": "ances in regard to their size,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 62, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 431.043, "r_y0": 171.476, "r_x1": 468.393, "r_y1": 171.476, "r_x2": 468.393, "r_y2": 162.92399999999998, "r_x3": 431.043, "r_y3": 162.92399999999998, "coord_origin": "TOPLEFT"}, "text": "structure,", "orig": "structure,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 63, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 472.508, "r_y0": 171.476, "r_x1": 491.327, "r_y1": 171.476, "r_x2": 491.327, "r_y2": 162.92399999999998, "r_x3": 472.508, "r_y3": 162.92399999999998, "coord_origin": "TOPLEFT"}, "text": "style", "orig": "style", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 64, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 495.113, "r_y0": 171.476, "r_x1": 545.115, "r_y1": 171.476, "r_x2": 545.115, "r_y2": 162.92399999999998, "r_x3": 495.113, "r_y3": 162.92399999999998, "coord_origin": "TOPLEFT"}, "text": "and content.", "orig": "and content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 65, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 183.43100000000004, "r_x1": 545.115, "r_y1": 183.43100000000004, "r_x2": 545.115, "r_y2": 174.87900000000002, "r_x3": 308.862, "r_y3": 174.87900000000002, "coord_origin": "TOPLEFT"}, "text": "Every synthetic dataset contains 150k examples, summing", "orig": "Every synthetic dataset contains 150k examples, summing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 66, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 195.38599999999997, "r_x1": 545.115, "r_y1": 195.38599999999997, "r_x2": 545.115, "r_y2": 186.83399999999995, "r_x3": 308.862, "r_y3": 186.83399999999995, "coord_origin": "TOPLEFT"}, "text": "up to 600k synthetic examples. All datasets are divided into", "orig": "up to 600k synthetic examples. All datasets are divided into", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 67, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 207.34199999999998, "r_x1": 484.074, "r_y1": 207.34199999999998, "r_x2": 484.074, "r_y2": 198.78999999999996, "r_x3": 308.862, "r_y3": 198.78999999999996, "coord_origin": "TOPLEFT"}, "text": "Train, Test and Val splits (80%, 10%, 10%).", "orig": "Train, Test and Val splits (80%, 10%, 10%).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "ances in regard to their size, structure, style and content. Every synthetic dataset contains 150k examples, summing up to 600k synthetic examples. All datasets are divided into Train, Test and Val splits (80%, 10%, 10%)."}, {"label": "text", "id": 15, "page_no": 10, "cluster": {"id": 15, "label": "text", "bbox": {"l": 308.862, "t": 211.50400000000002, "r": 545.115, "b": 232.01099999999997, "coord_origin": "TOPLEFT"}, "confidence": 0.9261796474456787, "cells": [{"index": 68, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 220.05600000000004, "r_x1": 545.115, "r_y1": 220.05600000000004, "r_x2": 545.115, "r_y2": 211.50400000000002, "r_x3": 320.817, "r_y3": 211.50400000000002, "coord_origin": "TOPLEFT"}, "text": "The process of generating a synthetic dataset can be de-", "orig": "The process of generating a synthetic dataset can be de-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 69, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 232.01099999999997, "r_x1": 448.089, "r_y1": 232.01099999999997, "r_x2": 448.089, "r_y2": 223.45899999999995, "r_x3": 308.862, "r_y3": 223.45899999999995, "coord_origin": "TOPLEFT"}, "text": "composed into the following steps:", "orig": "composed into the following steps:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "The process of generating a synthetic dataset can be decomposed into the following steps:"}, {"label": "list_item", "id": 7, "page_no": 10, "cluster": {"id": 7, "label": "list_item", "bbox": {"l": 308.862, "t": 236.17399999999998, "r": 545.115, "b": 316.457, "coord_origin": "TOPLEFT"}, "confidence": 0.9642952680587769, "cells": [{"index": 70, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 244.726, "r_x1": 328.289, "r_y1": 244.726, "r_x2": 328.289, "r_y2": 236.17399999999998, "r_x3": 320.817, "r_y3": 236.17399999999998, "coord_origin": "TOPLEFT"}, "text": "1.", "orig": "1.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 71, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 335.382, "r_y0": 244.726, "r_x1": 492.911, "r_y1": 244.726, "r_x2": 492.911, "r_y2": 236.17399999999998, "r_x3": 335.382, "r_y3": 236.17399999999998, "coord_origin": "TOPLEFT"}, "text": "Prepare styling and content templates:", "orig": "Prepare styling and content templates:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 72, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 498.669, "r_y0": 244.726, "r_x1": 545.115, "r_y1": 244.726, "r_x2": 545.115, "r_y2": 236.17399999999998, "r_x3": 498.669, "r_y3": 236.17399999999998, "coord_origin": "TOPLEFT"}, "text": "The styling", "orig": "The styling", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 73, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 256.68100000000004, "r_x1": 545.115, "r_y1": 256.68100000000004, "r_x2": 545.115, "r_y2": 248.12900000000002, "r_x3": 308.862, "r_y3": 248.12900000000002, "coord_origin": "TOPLEFT"}, "text": "templates have been manually designed and organized into", "orig": "templates have been manually designed and organized into", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 74, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 268.63599999999997, "r_x1": 481.733, "r_y1": 268.63599999999997, "r_x2": 481.733, "r_y2": 260.08399999999995, "r_x3": 308.862, "r_y3": 260.08399999999995, "coord_origin": "TOPLEFT"}, "text": "groups of scope specific appearances (e.g.", "orig": "groups of scope specific appearances (e.g.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 75, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 488.119, "r_y0": 268.63599999999997, "r_x1": 545.115, "r_y1": 268.63599999999997, "r_x2": 545.115, "r_y2": 260.08399999999995, "r_x3": 488.119, "r_y3": 260.08399999999995, "coord_origin": "TOPLEFT"}, "text": "financial data,", "orig": "financial data,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 76, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 280.591, "r_x1": 393.385, "r_y1": 280.591, "r_x2": 393.385, "r_y2": 272.039, "r_x3": 308.862, "r_y3": 272.039, "coord_origin": "TOPLEFT"}, "text": "marketing data, etc.)", "orig": "marketing data, etc.)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 77, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 400.119, "r_y0": 280.591, "r_x1": 545.115, "r_y1": 280.591, "r_x2": 545.115, "r_y2": 272.039, "r_x3": 400.119, "r_y3": 272.039, "coord_origin": "TOPLEFT"}, "text": "Additionally, we have prepared cu-", "orig": "Additionally, we have prepared cu-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 78, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 292.546, "r_x1": 545.115, "r_y1": 292.546, "r_x2": 545.115, "r_y2": 283.994, "r_x3": 308.862, "r_y3": 283.994, "coord_origin": "TOPLEFT"}, "text": "rated collections of content templates by extracting the most", "orig": "rated collections of content templates by extracting the most", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 79, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 304.502, "r_x1": 349.808, "r_y1": 304.502, "r_x2": 349.808, "r_y2": 295.95, "r_x3": 308.862, "r_y3": 295.95, "coord_origin": "TOPLEFT"}, "text": "frequently", "orig": "frequently", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 80, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 354.152, "r_y0": 304.502, "r_x1": 487.183, "r_y1": 304.502, "r_x2": 487.183, "r_y2": 295.95, "r_x3": 354.152, "r_y3": 295.95, "coord_origin": "TOPLEFT"}, "text": "used terms out of non-synthetic", "orig": "used terms out of non-synthetic", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 81, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 491.526, "r_y0": 304.502, "r_x1": 523.068, "r_y1": 304.502, "r_x2": 523.068, "r_y2": 295.95, "r_x3": 491.526, "r_y3": 295.95, "coord_origin": "TOPLEFT"}, "text": "datasets", "orig": "datasets", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 82, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 527.412, "r_y0": 304.502, "r_x1": 545.115, "r_y1": 304.502, "r_x2": 545.115, "r_y2": 295.95, "r_x3": 527.412, "r_y3": 295.95, "coord_origin": "TOPLEFT"}, "text": "(e.g.", "orig": "(e.g.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 83, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 316.457, "r_x1": 425.693, "r_y1": 316.457, "r_x2": 425.693, "r_y2": 307.905, "r_x3": 308.862, "r_y3": 307.905, "coord_origin": "TOPLEFT"}, "text": "PubTabNet, FinTabNet, etc.).", "orig": "PubTabNet, FinTabNet, etc.).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "1. Prepare styling and content templates: The styling templates have been manually designed and organized into groups of scope specific appearances (e.g. financial data, marketing data, etc.) Additionally, we have prepared curated collections of content templates by extracting the most frequently used terms out of non-synthetic datasets (e.g. PubTabNet, FinTabNet, etc.)."}, {"label": "list_item", "id": 6, "page_no": 10, "cluster": {"id": 6, "label": "list_item", "bbox": {"l": 308.862, "t": 320.619, "r": 545.115, "b": 448.723, "coord_origin": "TOPLEFT"}, "confidence": 0.9699994921684265, "cells": [{"index": 84, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 329.171, "r_x1": 328.289, "r_y1": 329.171, "r_x2": 328.289, "r_y2": 320.619, "r_x3": 320.817, "r_y3": 320.619, "coord_origin": "TOPLEFT"}, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 85, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 332.692, "r_y0": 329.171, "r_x1": 435.377, "r_y1": 329.171, "r_x2": 435.377, "r_y2": 320.619, "r_x3": 332.692, "r_y3": 320.619, "coord_origin": "TOPLEFT"}, "text": "Generate table structures:", "orig": "Generate table structures:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 86, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 439.342, "r_y0": 329.171, "r_x1": 545.115, "r_y1": 329.171, "r_x2": 545.115, "r_y2": 320.619, "r_x3": 439.342, "r_y3": 320.619, "coord_origin": "TOPLEFT"}, "text": "The structure of each syn-", "orig": "The structure of each syn-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 87, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 341.126, "r_x1": 545.115, "r_y1": 341.126, "r_x2": 545.115, "r_y2": 332.574, "r_x3": 308.862, "r_y3": 332.574, "coord_origin": "TOPLEFT"}, "text": "thetic dataset assumes a horizontal table header which po-", "orig": "thetic dataset assumes a horizontal table header which po-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 88, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 353.081, "r_x1": 341.519, "r_y1": 353.081, "r_x2": 341.519, "r_y2": 344.529, "r_x3": 308.862, "r_y3": 344.529, "coord_origin": "TOPLEFT"}, "text": "tentially", "orig": "tentially", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 89, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 345.813, "r_y0": 353.081, "r_x1": 427.168, "r_y1": 353.081, "r_x2": 427.168, "r_y2": 344.529, "r_x3": 345.813, "r_y3": 344.529, "coord_origin": "TOPLEFT"}, "text": "spans over multiple", "orig": "spans over multiple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 90, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 431.462, "r_y0": 353.081, "r_x1": 545.115, "r_y1": 353.081, "r_x2": 545.115, "r_y2": 344.529, "r_x3": 431.462, "r_y3": 344.529, "coord_origin": "TOPLEFT"}, "text": "rows and a table body that", "orig": "rows and a table body that", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 91, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 365.037, "r_x1": 545.115, "r_y1": 365.037, "r_x2": 545.115, "r_y2": 356.485, "r_x3": 308.862, "r_y3": 356.485, "coord_origin": "TOPLEFT"}, "text": "may contain a combination of row spans and column spans.", "orig": "may contain a combination of row spans and column spans.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 92, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 376.992, "r_x1": 545.115, "r_y1": 376.992, "r_x2": 545.115, "r_y2": 368.44, "r_x3": 308.862, "r_y3": 368.44, "coord_origin": "TOPLEFT"}, "text": "However, spans are not allowed to cross the header - body", "orig": "However, spans are not allowed to cross the header - body", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 93, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 388.947, "r_x1": 348.334, "r_y1": 388.947, "r_x2": 348.334, "r_y2": 380.395, "r_x3": 308.862, "r_y3": 380.395, "coord_origin": "TOPLEFT"}, "text": "boundary.", "orig": "boundary.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 94, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 353.504, "r_y0": 388.947, "r_x1": 545.115, "r_y1": 388.947, "r_x2": 545.115, "r_y2": 380.395, "r_x3": 353.504, "r_y3": 380.395, "coord_origin": "TOPLEFT"}, "text": "The table structure is described by the parame-", "orig": "The table structure is described by the parame-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 95, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 400.902, "r_x1": 326.018, "r_y1": 400.902, "r_x2": 326.018, "r_y2": 392.35, "r_x3": 308.862, "r_y3": 392.35, "coord_origin": "TOPLEFT"}, "text": "ters:", "orig": "ters:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 96, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 330.909, "r_y0": 400.902, "r_x1": 545.115, "r_y1": 400.902, "r_x2": 545.115, "r_y2": 392.35, "r_x3": 330.909, "r_y3": 392.35, "coord_origin": "TOPLEFT"}, "text": "Total number of table rows and columns, number of", "orig": "Total number of table rows and columns, number of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 97, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 412.857, "r_x1": 545.115, "r_y1": 412.857, "r_x2": 545.115, "r_y2": 404.305, "r_x3": 308.862, "r_y3": 404.305, "coord_origin": "TOPLEFT"}, "text": "header rows, type of spans (header only spans, row only", "orig": "header rows, type of spans (header only spans, row only", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 98, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 424.812, "r_x1": 333.49, "r_y1": 424.812, "r_x2": 333.49, "r_y2": 416.26, "r_x3": 308.862, "r_y3": 416.26, "coord_origin": "TOPLEFT"}, "text": "spans,", "orig": "spans,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 99, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 338.082, "r_y0": 424.812, "r_x1": 418.66, "r_y1": 424.812, "r_x2": 418.66, "r_y2": 416.26, "r_x3": 338.082, "r_y3": 416.26, "coord_origin": "TOPLEFT"}, "text": "column only spans,", "orig": "column only spans,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 100, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 423.253, "r_y0": 424.812, "r_x1": 545.115, "r_y1": 424.812, "r_x2": 545.115, "r_y2": 416.26, "r_x3": 423.253, "r_y3": 416.26, "coord_origin": "TOPLEFT"}, "text": "both row and column spans),", "orig": "both row and column spans),", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 101, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 436.768, "r_x1": 545.115, "r_y1": 436.768, "r_x2": 545.115, "r_y2": 428.216, "r_x3": 308.862, "r_y3": 428.216, "coord_origin": "TOPLEFT"}, "text": "maximum span size and the ratio of the table area covered", "orig": "maximum span size and the ratio of the table area covered", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 102, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 448.723, "r_x1": 345.943, "r_y1": 448.723, "r_x2": 345.943, "r_y2": 440.171, "r_x3": 308.862, "r_y3": 440.171, "coord_origin": "TOPLEFT"}, "text": "by spans.", "orig": "by spans.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "2. Generate table structures: The structure of each synthetic dataset assumes a horizontal table header which potentially spans over multiple rows and a table body that may contain a combination of row spans and column spans. However, spans are not allowed to cross the header - body boundary. The table structure is described by the parameters: Total number of table rows and columns, number of header rows, type of spans (header only spans, row only spans, column only spans, both row and column spans), maximum span size and the ratio of the table area covered by spans."}, {"label": "list_item", "id": 9, "page_no": 10, "cluster": {"id": 9, "label": "list_item", "bbox": {"l": 308.862, "t": 452.706, "r": 545.115, "b": 497.303, "coord_origin": "TOPLEFT"}, "confidence": 0.9568928480148315, "cells": [{"index": 103, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 461.437, "r_x1": 485.758, "r_y1": 461.437, "r_x2": 485.758, "r_y2": 452.885, "r_x3": 320.817, "r_y3": 452.885, "coord_origin": "TOPLEFT"}, "text": "3. Generate content: Based on the dataset", "orig": "3. Generate content: Based on the dataset", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 104, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 488.073, "r_y0": 461.294, "r_x1": 511.864, "r_y1": 461.294, "r_x2": 511.864, "r_y2": 452.706, "r_x3": 488.073, "r_y3": 452.706, "coord_origin": "TOPLEFT"}, "text": "theme", "orig": "theme", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 105, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 511.863, "r_y0": 461.437, "r_x1": 545.108, "r_y1": 461.437, "r_x2": 545.108, "r_y2": 452.885, "r_x3": 511.863, "r_y3": 452.885, "coord_origin": "TOPLEFT"}, "text": ", a set of", "orig": ", a set of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 106, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 473.392, "r_x1": 545.115, "r_y1": 473.392, "r_x2": 545.115, "r_y2": 464.84, "r_x3": 308.862, "r_y3": 464.84, "coord_origin": "TOPLEFT"}, "text": "suitable content templates is chosen first. Then, this content", "orig": "suitable content templates is chosen first. Then, this content", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 107, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 485.348, "r_x1": 545.115, "r_y1": 485.348, "r_x2": 545.115, "r_y2": 476.796, "r_x3": 308.862, "r_y3": 476.796, "coord_origin": "TOPLEFT"}, "text": "can be combined with purely random text to produce the", "orig": "can be combined with purely random text to produce the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 108, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 497.303, "r_x1": 379.148, "r_y1": 497.303, "r_x2": 379.148, "r_y2": 488.751, "r_x3": 308.862, "r_y3": 488.751, "coord_origin": "TOPLEFT"}, "text": "synthetic content.", "orig": "synthetic content.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "3. Generate content: Based on the dataset theme , a set of suitable content templates is chosen first. Then, this content can be combined with purely random text to produce the synthetic content."}, {"label": "list_item", "id": 5, "page_no": 10, "cluster": {"id": 5, "label": "list_item", "bbox": {"l": 308.862, "t": 501.465, "r": 545.115, "b": 545.883, "coord_origin": "TOPLEFT"}, "confidence": 0.9710659980773926, "cells": [{"index": 109, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 510.017, "r_x1": 328.289, "r_y1": 510.017, "r_x2": 328.289, "r_y2": 501.465, "r_x3": 320.817, "r_y3": 501.465, "coord_origin": "TOPLEFT"}, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 110, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 334.217, "r_y0": 510.017, "r_x1": 434.082, "r_y1": 510.017, "r_x2": 434.082, "r_y2": 501.465, "r_x3": 334.217, "r_y3": 501.465, "coord_origin": "TOPLEFT"}, "text": "Apply styling templates:", "orig": "Apply styling templates:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 111, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 439.063, "r_y0": 510.017, "r_x1": 545.115, "r_y1": 510.017, "r_x2": 545.115, "r_y2": 501.465, "r_x3": 439.063, "r_y3": 501.465, "coord_origin": "TOPLEFT"}, "text": "Depending on the domain", "orig": "Depending on the domain", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 112, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 521.972, "r_x1": 406.884, "r_y1": 521.972, "r_x2": 406.884, "r_y2": 513.4200000000001, "r_x3": 308.862, "r_y3": 513.4200000000001, "coord_origin": "TOPLEFT"}, "text": "of the synthetic dataset,", "orig": "of the synthetic dataset,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 113, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 411.019, "r_y0": 521.972, "r_x1": 545.115, "r_y1": 521.972, "r_x2": 545.115, "r_y2": 513.4200000000001, "r_x3": 411.019, "r_y3": 513.4200000000001, "coord_origin": "TOPLEFT"}, "text": "a set of styling templates is first", "orig": "a set of styling templates is first", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 114, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 533.928, "r_x1": 384.299, "r_y1": 533.928, "r_x2": 384.299, "r_y2": 525.376, "r_x3": 308.862, "r_y3": 525.376, "coord_origin": "TOPLEFT"}, "text": "manually selected.", "orig": "manually selected.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 115, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 391.253, "r_y0": 533.928, "r_x1": 545.115, "r_y1": 533.928, "r_x2": 545.115, "r_y2": 525.376, "r_x3": 391.253, "r_y3": 525.376, "coord_origin": "TOPLEFT"}, "text": "Then, a style is randomly selected to", "orig": "Then, a style is randomly selected to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 116, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 545.883, "r_x1": 496.159, "r_y1": 545.883, "r_x2": 496.159, "r_y2": 537.331, "r_x3": 308.862, "r_y3": 537.331, "coord_origin": "TOPLEFT"}, "text": "format the appearance of the synthesized table.", "orig": "format the appearance of the synthesized table.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "4. Apply styling templates: Depending on the domain of the synthetic dataset, a set of styling templates is first manually selected. Then, a style is randomly selected to format the appearance of the synthesized table."}, {"label": "list_item", "id": 4, "page_no": 10, "cluster": {"id": 4, "label": "list_item", "bbox": {"l": 308.862, "t": 550.045, "r": 545.115, "b": 606.418, "coord_origin": "TOPLEFT"}, "confidence": 0.9778757095336914, "cells": [{"index": 117, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 558.597, "r_x1": 328.289, "r_y1": 558.597, "r_x2": 328.289, "r_y2": 550.045, "r_x3": 320.817, "r_y3": 550.045, "coord_origin": "TOPLEFT"}, "text": "5.", "orig": "5.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 118, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 335.402, "r_y0": 558.597, "r_x1": 450.371, "r_y1": 558.597, "r_x2": 450.371, "r_y2": 550.045, "r_x3": 335.402, "r_y3": 550.045, "coord_origin": "TOPLEFT"}, "text": "Render the complete tables:", "orig": "Render the complete tables:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 119, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 456.139, "r_y0": 558.597, "r_x1": 545.115, "r_y1": 558.597, "r_x2": 545.115, "r_y2": 550.045, "r_x3": 456.139, "r_y3": 550.045, "coord_origin": "TOPLEFT"}, "text": "The synthetic table is", "orig": "The synthetic table is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 120, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 570.552, "r_x1": 334.326, "r_y1": 570.552, "r_x2": 334.326, "r_y2": 562.0, "r_x3": 308.862, "r_y3": 562.0, "coord_origin": "TOPLEFT"}, "text": "finally", "orig": "finally", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 121, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 337.983, "r_y0": 570.552, "r_x1": 545.115, "r_y1": 570.552, "r_x2": 545.115, "r_y2": 562.0, "r_x3": 337.983, "r_y3": 562.0, "coord_origin": "TOPLEFT"}, "text": "rendered by a web browser engine to generate the", "orig": "rendered by a web browser engine to generate the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 122, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 582.5070000000001, "r_x1": 545.115, "r_y1": 582.5070000000001, "r_x2": 545.115, "r_y2": 573.955, "r_x3": 308.862, "r_y3": 573.955, "coord_origin": "TOPLEFT"}, "text": "bounding boxes for each table cell. A batching technique is", "orig": "bounding boxes for each table cell. A batching technique is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 123, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 594.463, "r_x1": 545.115, "r_y1": 594.463, "r_x2": 545.115, "r_y2": 585.9110000000001, "r_x3": 308.862, "r_y3": 585.9110000000001, "coord_origin": "TOPLEFT"}, "text": "utilized to optimize the runtime overhead of the rendering", "orig": "utilized to optimize the runtime overhead of the rendering", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 124, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 606.418, "r_x1": 341.23, "r_y1": 606.418, "r_x2": 341.23, "r_y2": 597.866, "r_x3": 308.862, "r_y3": 597.866, "coord_origin": "TOPLEFT"}, "text": "process.", "orig": "process.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "5. Render the complete tables: The synthetic table is finally rendered by a web browser engine to generate the bounding boxes for each table cell. A batching technique is utilized to optimize the runtime overhead of the rendering process."}, {"label": "section_header", "id": 10, "page_no": 10, "cluster": {"id": 10, "label": "section_header", "bbox": {"l": 308.862, "t": 622.2909999999999, "r": 545.109, "b": 646.987, "coord_origin": "TOPLEFT"}, "confidence": 0.954940915107727, "cells": [{"index": 125, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 633.039, "r_x1": 317.828, "r_y1": 633.039, "r_x2": 317.828, "r_y2": 622.2909999999999, "r_x3": 308.862, "r_y3": 622.2909999999999, "coord_origin": "TOPLEFT"}, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 126, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 323.591, "r_y0": 633.039, "r_x1": 376.493, "r_y1": 633.039, "r_x2": 376.493, "r_y2": 622.2909999999999, "r_x3": 323.591, "r_y3": 622.2909999999999, "coord_origin": "TOPLEFT"}, "text": "Prediction", "orig": "Prediction", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 127, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 382.255, "r_y0": 633.039, "r_x1": 461.076, "r_y1": 633.039, "r_x2": 461.076, "r_y2": 622.2909999999999, "r_x3": 382.255, "r_y3": 622.2909999999999, "coord_origin": "TOPLEFT"}, "text": "post-processing", "orig": "post-processing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 128, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 466.826, "r_y0": 633.039, "r_x1": 481.794, "r_y1": 633.039, "r_x2": 481.794, "r_y2": 622.2909999999999, "r_x3": 466.826, "r_y3": 622.2909999999999, "coord_origin": "TOPLEFT"}, "text": "for", "orig": "for", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 129, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 487.556, "r_y0": 633.039, "r_x1": 545.109, "r_y1": 633.039, "r_x2": 545.109, "r_y2": 622.2909999999999, "r_x3": 487.556, "r_y3": 622.2909999999999, "coord_origin": "TOPLEFT"}, "text": "PDF docu-", "orig": "PDF docu-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 130, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 326.795, "r_y0": 646.987, "r_x1": 357.341, "r_y1": 646.987, "r_x2": 357.341, "r_y2": 636.239, "r_x3": 326.795, "r_y3": 636.239, "coord_origin": "TOPLEFT"}, "text": "ments", "orig": "ments", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "2. Prediction post-processing for PDF documents"}, {"label": "text", "id": 1, "page_no": 10, "cluster": {"id": 1, "label": "text", "bbox": {"l": 308.862, "t": 657.69, "r": 545.115, "b": 714.063, "coord_origin": "TOPLEFT"}, "confidence": 0.9829329252243042, "cells": [{"index": 131, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 666.242, "r_x1": 545.115, "r_y1": 666.242, "r_x2": 545.115, "r_y2": 657.69, "r_x3": 320.817, "r_y3": 657.69, "coord_origin": "TOPLEFT"}, "text": "Although TableFormer can predict the table structure and", "orig": "Although TableFormer can predict the table structure and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 132, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 678.197, "r_x1": 545.115, "r_y1": 678.197, "r_x2": 545.115, "r_y2": 669.645, "r_x3": 308.862, "r_y3": 669.645, "coord_origin": "TOPLEFT"}, "text": "the bounding boxes for tables recognized inside PDF docu-", "orig": "the bounding boxes for tables recognized inside PDF docu-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 133, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 690.152, "r_x1": 545.115, "r_y1": 690.152, "r_x2": 545.115, "r_y2": 681.6, "r_x3": 308.862, "r_y3": 681.6, "coord_origin": "TOPLEFT"}, "text": "ments, this is not enough when a full reconstruction of the", "orig": "ments, this is not enough when a full reconstruction of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 134, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 702.107, "r_x1": 545.115, "r_y1": 702.107, "r_x2": 545.115, "r_y2": 693.5550000000001, "r_x3": 308.862, "r_y3": 693.5550000000001, "coord_origin": "TOPLEFT"}, "text": "original table is required. This happens mainly due the fol-", "orig": "original table is required. This happens mainly due the fol-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 135, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 714.063, "r_x1": 371.427, "r_y1": 714.063, "r_x2": 371.427, "r_y2": 705.511, "r_x3": 308.862, "r_y3": 705.511, "coord_origin": "TOPLEFT"}, "text": "lowing reasons:", "orig": "lowing reasons:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Although TableFormer can predict the table structure and the bounding boxes for tables recognized inside PDF documents, this is not enough when a full reconstruction of the original table is required. This happens mainly due the following reasons:"}], "headers": [{"label": "page_footer", "id": 16, "page_no": 10, "cluster": {"id": 16, "label": "page_footer", "bbox": {"l": 292.631, "t": 734.402, "r": 302.594, "b": 742.954, "coord_origin": "TOPLEFT"}, "confidence": 0.8986663222312927, "cells": [{"index": 136, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 292.631, "r_y0": 742.954, "r_x1": 302.594, "r_y1": 742.954, "r_x2": 302.594, "r_y2": 734.402, "r_x3": 292.631, "r_y3": 734.402, "coord_origin": "TOPLEFT"}, "text": "11", "orig": "11", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "11"}]}}, {"page_no": 11, "size": {"width": 612.0, "height": 792.0}, "cells": [{"index": 0, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 119.391, "r_y0": 83.19600000000003, "r_x1": 151.946, "r_y1": 83.19600000000003, "r_x2": 151.946, "r_y2": 77.543, "r_x3": 119.391, "r_y3": 77.543, "coord_origin": "TOPLEFT"}, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 53.346, "r_y0": 81.077, "r_x1": 59.327, "r_y1": 81.077, "r_x2": 59.327, "r_y2": 75.42399999999998, "r_x3": 53.346, "r_y3": 75.42399999999998, "coord_origin": "TOPLEFT"}, "text": "b.", "orig": "b.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 289.579, "r_y0": 83.34400000000005, "r_x1": 319.827, "r_y1": 83.34400000000005, "r_x2": 319.827, "r_y2": 77.69100000000003, "r_x3": 289.579, "r_y3": 77.69100000000003, "coord_origin": "TOPLEFT"}, "text": "FinTabNet", "orig": "FinTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 448.373, "r_y0": 83.13999999999999, "r_x1": 481.759, "r_y1": 83.13999999999999, "r_x2": 481.759, "r_y2": 77.48699999999997, "r_x3": 448.373, "r_y3": 77.48699999999997, "coord_origin": "TOPLEFT"}, "text": "Table Bank", "orig": "Table Bank", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 82.553, "r_y0": 146.18100000000004, "r_x1": 105.08, "r_y1": 146.18100000000004, "r_x2": 105.08, "r_y2": 141.47000000000003, "r_x3": 82.553, "r_y3": 141.47000000000003, "coord_origin": "TOPLEFT"}, "text": "Train Val", "orig": "Train Val", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 63.039, "r_y0": 106.00900000000001, "r_x1": 85.29, "r_y1": 106.00900000000001, "r_x2": 85.29, "r_y2": 101.298, "r_x3": 63.039, "r_y3": 101.298, "coord_origin": "TOPLEFT"}, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 67.768, "r_y0": 129.29999999999995, "r_x1": 85.231, "r_y1": 129.29999999999995, "r_x2": 85.231, "r_y2": 124.58900000000006, "r_x3": 67.768, "r_y3": 124.58900000000006, "coord_origin": "TOPLEFT"}, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 227.551, "r_y0": 107.44500000000005, "r_x1": 249.803, "r_y1": 107.44500000000005, "r_x2": 249.803, "r_y2": 102.73400000000004, "r_x3": 227.551, "r_y3": 102.73400000000004, "coord_origin": "TOPLEFT"}, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 232.199, "r_y0": 131.89099999999996, "r_x1": 249.662, "r_y1": 131.89099999999996, "r_x2": 249.662, "r_y2": 127.17999999999995, "r_x3": 232.199, "r_y3": 127.17999999999995, "coord_origin": "TOPLEFT"}, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 396.234, "r_y0": 118.95000000000005, "r_x1": 413.697, "r_y1": 118.95000000000005, "r_x2": 413.697, "r_y2": 114.23900000000003, "r_x3": 396.234, "r_y3": 114.23900000000003, "coord_origin": "TOPLEFT"}, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 60.938, "r_y0": 90.63800000000003, "r_x1": 76.151, "r_y1": 90.63800000000003, "r_x2": 76.151, "r_y2": 85.92700000000002, "r_x3": 60.938, "r_y3": 85.92700000000002, "coord_origin": "TOPLEFT"}, "text": "100%", "orig": "100%", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 82.305, "r_y0": 91.12800000000004, "r_x1": 106.992, "r_y1": 91.10699999999997, "r_x2": 106.992, "r_y2": 86.39599999999996, "r_x3": 82.305, "r_y3": 86.41700000000003, "coord_origin": "TOPLEFT"}, "text": "500K 10K", "orig": "500K 10K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 246.205, "r_y0": 146.51099999999997, "r_x1": 271.386, "r_y1": 146.51099999999997, "r_x2": 271.386, "r_y2": 141.79999999999995, "r_x3": 246.205, "r_y3": 141.79999999999995, "coord_origin": "TOPLEFT"}, "text": "Train Test", "orig": "Train Test", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 274.182, "r_y0": 146.51099999999997, "r_x1": 281.88, "r_y1": 146.51099999999997, "r_x2": 281.88, "r_y2": 141.79999999999995, "r_x3": 274.182, "r_y3": 141.79999999999995, "coord_origin": "TOPLEFT"}, "text": "Val", "orig": "Val", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 226.698, "r_y0": 90.63800000000003, "r_x1": 241.912, "r_y1": 90.63800000000003, "r_x2": 241.912, "r_y2": 85.92700000000002, "r_x3": 226.698, "r_y3": 85.92700000000002, "coord_origin": "TOPLEFT"}, "text": "100%", "orig": "100%", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 249.939, "r_y0": 90.99300000000005, "r_x1": 282.494, "r_y1": 91.0, "r_x2": 282.494, "r_y2": 86.28899999999999, "r_x3": 249.939, "r_y3": 86.28200000000004, "coord_origin": "TOPLEFT"}, "text": "91K 10K10K", "orig": "91K 10K10K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 410.194, "r_y0": 146.18100000000004, "r_x1": 434.278, "r_y1": 146.32799999999997, "r_x2": 434.278, "r_y2": 141.61699999999996, "r_x3": 410.194, "r_y3": 141.47000000000003, "coord_origin": "TOPLEFT"}, "text": "Train Test", "orig": "Train Test", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 436.991, "r_y0": 146.32799999999997, "r_x1": 444.689, "r_y1": 146.32799999999997, "r_x2": 444.689, "r_y2": 141.61699999999996, "r_x3": 436.991, "r_y3": 141.61699999999996, "coord_origin": "TOPLEFT"}, "text": "Val", "orig": "Val", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 391.373, "r_y0": 90.63800000000003, "r_x1": 406.587, "r_y1": 90.63800000000003, "r_x2": 406.587, "r_y2": 85.92700000000002, "r_x3": 391.373, "r_y3": 85.92700000000002, "coord_origin": "TOPLEFT"}, "text": "100%", "orig": "100%", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 19, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 410.521, "r_y0": 91.12800000000004, "r_x1": 445.624, "r_y1": 91.16600000000005, "r_x2": 445.624, "r_y2": 86.45500000000004, "r_x3": 410.521, "r_y3": 86.41700000000003, "coord_origin": "TOPLEFT"}, "text": "130K 5K 10K", "orig": "130K 5K 10K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 20, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 113.949, "r_y0": 146.19299999999998, "r_x1": 156.042, "r_y1": 146.341, "r_x2": 156.042, "r_y2": 141.63, "r_x3": 113.949, "r_y3": 141.48199999999997, "coord_origin": "TOPLEFT"}, "text": "Complex Simple", "orig": "Complex Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 21, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 116.916, "r_y0": 99.72299999999996, "r_x1": 127.054, "r_y1": 99.72299999999996, "r_x2": 127.054, "r_y2": 95.01199999999994, "r_x3": 116.916, "r_y3": 95.01199999999994, "coord_origin": "TOPLEFT"}, "text": "Non", "orig": "Non", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 22, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 113.315, "r_y0": 105.84299999999996, "r_x1": 127.053, "r_y1": 105.84299999999996, "r_x2": 127.053, "r_y2": 101.13199999999995, "r_x3": 113.315, "r_y3": 101.13199999999995, "coord_origin": "TOPLEFT"}, "text": "Strict", "orig": "Strict", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 23, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 112.941, "r_y0": 111.96299999999997, "r_x1": 127.055, "r_y1": 111.96299999999997, "r_x2": 127.055, "r_y2": 107.25199999999995, "r_x3": 112.941, "r_y3": 107.25199999999995, "coord_origin": "TOPLEFT"}, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 24, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 113.227, "r_y0": 127.51999999999998, "r_x1": 126.966, "r_y1": 127.51999999999998, "r_x2": 126.966, "r_y2": 122.80899999999997, "r_x3": 113.227, "r_y3": 122.80899999999997, "coord_origin": "TOPLEFT"}, "text": "Strict", "orig": "Strict", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 25, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 112.854, "r_y0": 133.64, "r_x1": 126.968, "r_y1": 133.64, "r_x2": 126.968, "r_y2": 128.92899999999997, "r_x3": 112.854, "r_y3": 128.92899999999997, "coord_origin": "TOPLEFT"}, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 26, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 122.031, "r_y0": 91.17600000000004, "r_x1": 151.042, "r_y1": 91.17100000000005, "r_x2": 151.042, "r_y2": 86.46000000000004, "r_x3": 122.031, "r_y3": 86.46500000000003, "coord_origin": "TOPLEFT"}, "text": "230K 280K", "orig": "230K 280K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 27, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 311.654, "r_y0": 91.46000000000004, "r_x1": 321.672, "r_y1": 91.46000000000004, "r_x2": 321.672, "r_y2": 86.74900000000002, "r_x3": 311.654, "r_y3": 86.74900000000002, "coord_origin": "TOPLEFT"}, "text": "65K", "orig": "65K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 28, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 287.894, "r_y0": 146.615, "r_x1": 328.809, "r_y1": 146.615, "r_x2": 328.809, "r_y2": 141.904, "r_x3": 287.894, "r_y3": 141.904, "coord_origin": "TOPLEFT"}, "text": "Complex Simple", "orig": "Complex Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 29, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 289.236, "r_y0": 97.98500000000001, "r_x1": 299.375, "r_y1": 97.98500000000001, "r_x2": 299.375, "r_y2": 93.274, "r_x3": 289.236, "r_y3": 93.274, "coord_origin": "TOPLEFT"}, "text": "Non", "orig": "Non", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 30, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 285.635, "r_y0": 104.10500000000002, "r_x1": 299.373, "r_y1": 104.10500000000002, "r_x2": 299.373, "r_y2": 99.394, "r_x3": 285.635, "r_y3": 99.394, "coord_origin": "TOPLEFT"}, "text": "Strict", "orig": "Strict", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 285.261, "r_y0": 110.22500000000002, "r_x1": 299.375, "r_y1": 110.22500000000002, "r_x2": 299.375, "r_y2": 105.51400000000001, "r_x3": 285.261, "r_y3": 105.51400000000001, "coord_origin": "TOPLEFT"}, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 285.431, "r_y0": 125.29499999999996, "r_x1": 299.169, "r_y1": 125.29499999999996, "r_x2": 299.169, "r_y2": 120.58399999999995, "r_x3": 285.431, "r_y3": 120.58399999999995, "coord_origin": "TOPLEFT"}, "text": "Strict", "orig": "Strict", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 285.057, "r_y0": 131.41499999999996, "r_x1": 299.171, "r_y1": 131.41499999999996, "r_x2": 299.171, "r_y2": 126.70399999999995, "r_x3": 285.057, "r_y3": 126.70399999999995, "coord_origin": "TOPLEFT"}, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 299.584, "r_y0": 91.59799999999996, "r_x1": 309.602, "r_y1": 91.59799999999996, "r_x2": 309.602, "r_y2": 86.88699999999994, "r_x3": 299.584, "r_y3": 86.88699999999994, "coord_origin": "TOPLEFT"}, "text": "47K", "orig": "47K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 466.041, "r_y0": 146.57600000000002, "r_x1": 483.504, "r_y1": 146.57600000000002, "r_x2": 483.504, "r_y2": 141.86599999999999, "r_x3": 466.041, "r_y3": 141.86599999999999, "coord_origin": "TOPLEFT"}, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 459.022, "r_y0": 98.66600000000005, "r_x1": 469.16, "r_y1": 98.66600000000005, "r_x2": 469.16, "r_y2": 93.95500000000004, "r_x3": 459.022, "r_y3": 93.95500000000004, "coord_origin": "TOPLEFT"}, "text": "Non", "orig": "Non", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 455.421, "r_y0": 104.78599999999994, "r_x1": 469.159, "r_y1": 104.78599999999994, "r_x2": 469.159, "r_y2": 100.07500000000005, "r_x3": 455.421, "r_y3": 100.07500000000005, "coord_origin": "TOPLEFT"}, "text": "Strict", "orig": "Strict", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 455.047, "r_y0": 110.90599999999995, "r_x1": 469.161, "r_y1": 110.90599999999995, "r_x2": 469.161, "r_y2": 106.19500000000005, "r_x3": 455.047, "r_y3": 106.19500000000005, "coord_origin": "TOPLEFT"}, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 467.394, "r_y0": 90.47699999999998, "r_x1": 480.655, "r_y1": 90.47699999999998, "r_x2": 480.655, "r_y2": 85.76599999999996, "r_x3": 467.394, "r_y3": 85.76599999999996, "coord_origin": "TOPLEFT"}, "text": "145K", "orig": "145K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.377, "r_y0": 146.48900000000003, "r_x1": 202.841, "r_y1": 146.61599999999999, "r_x2": 202.841, "r_y2": 141.90499999999997, "r_x3": 160.377, "r_y3": 141.77800000000002, "coord_origin": "TOPLEFT"}, "text": "Complex Simple", "orig": "Complex Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 153.743, "r_y0": 99.76999999999998, "r_x1": 173.327, "r_y1": 99.76999999999998, "r_x2": 173.327, "r_y2": 95.05899999999997, "r_x3": 153.743, "r_y3": 95.05899999999997, "coord_origin": "TOPLEFT"}, "text": "Contain", "orig": "Contain", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 154.51, "r_y0": 105.88999999999999, "r_x1": 173.325, "r_y1": 105.88999999999999, "r_x2": 173.325, "r_y2": 101.17899999999997, "r_x3": 154.51, "r_y3": 101.17899999999997, "coord_origin": "TOPLEFT"}, "text": "Missing", "orig": "Missing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 155.272, "r_y0": 112.00999999999999, "r_x1": 173.327, "r_y1": 112.00999999999999, "r_x2": 173.327, "r_y2": 107.29899999999998, "r_x3": 155.272, "r_y3": 107.29899999999998, "coord_origin": "TOPLEFT"}, "text": "bboxes", "orig": "bboxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 326.413, "r_y0": 112.13699999999994, "r_x1": 345.997, "r_y1": 112.13699999999994, "r_x2": 345.997, "r_y2": 107.42600000000004, "r_x3": 326.413, "r_y3": 107.42600000000004, "coord_origin": "TOPLEFT"}, "text": "Contain", "orig": "Contain", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 327.18, "r_y0": 118.25699999999995, "r_x1": 345.995, "r_y1": 118.25699999999995, "r_x2": 345.995, "r_y2": 113.54600000000005, "r_x3": 327.18, "r_y3": 113.54600000000005, "coord_origin": "TOPLEFT"}, "text": "Missing", "orig": "Missing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 327.941, "r_y0": 124.37699999999995, "r_x1": 345.996, "r_y1": 124.37699999999995, "r_x2": 345.996, "r_y2": 119.66600000000005, "r_x3": 327.941, "r_y3": 119.66600000000005, "coord_origin": "TOPLEFT"}, "text": "bboxes", "orig": "bboxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 488.994, "r_y0": 109.05899999999997, "r_x1": 508.764, "r_y1": 109.05899999999997, "r_x2": 508.764, "r_y2": 104.34799999999996, "r_x3": 488.994, "r_y3": 104.34799999999996, "coord_origin": "TOPLEFT"}, "text": "Dataset", "orig": "Dataset", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 48, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 490.189, "r_y0": 115.17899999999997, "r_x1": 508.764, "r_y1": 115.17899999999997, "r_x2": 508.764, "r_y2": 110.46799999999996, "r_x3": 490.189, "r_y3": 110.46799999999996, "coord_origin": "TOPLEFT"}, "text": "doesn't", "orig": "doesn't", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 49, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 489.72, "r_y0": 121.29899999999998, "r_x1": 508.768, "r_y1": 121.29899999999998, "r_x2": 508.768, "r_y2": 116.58799999999997, "r_x3": 489.72, "r_y3": 116.58799999999997, "coord_origin": "TOPLEFT"}, "text": "provide", "orig": "provide", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 50, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 490.711, "r_y0": 127.41899999999998, "r_x1": 508.766, "r_y1": 127.41899999999998, "r_x2": 508.766, "r_y2": 122.70799999999997, "r_x3": 490.711, "r_y3": 122.70799999999997, "coord_origin": "TOPLEFT"}, "text": "bboxes", "orig": "bboxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 51, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 168.504, "r_y0": 91.04100000000005, "r_x1": 197.527, "r_y1": 91.0, "r_x2": 197.527, "r_y2": 86.28899999999999, "r_x3": 168.504, "r_y3": 86.33000000000004, "coord_origin": "TOPLEFT"}, "text": "230K 280K", "orig": "230K 280K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 52, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 357.377, "r_y0": 90.90200000000004, "r_x1": 367.395, "r_y1": 90.90200000000004, "r_x2": 367.395, "r_y2": 86.19100000000003, "r_x3": 357.377, "r_y3": 86.19100000000003, "coord_origin": "TOPLEFT"}, "text": "65K", "orig": "65K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 53, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 333.732, "r_y0": 146.52800000000002, "r_x1": 374.929, "r_y1": 146.52800000000002, "r_x2": 374.929, "r_y2": 141.817, "r_x3": 333.732, "r_y3": 141.817, "coord_origin": "TOPLEFT"}, "text": "Complex Simple", "orig": "Complex Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 54, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 345.691, "r_y0": 90.96100000000001, "r_x1": 355.709, "r_y1": 90.96100000000001, "r_x2": 355.709, "r_y2": 86.25, "r_x3": 345.691, "r_y3": 86.25, "coord_origin": "TOPLEFT"}, "text": "47K", "orig": "47K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 55, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 508.543, "r_y0": 146.28200000000004, "r_x1": 526.006, "r_y1": 146.28200000000004, "r_x2": 526.006, "r_y2": 141.57100000000003, "r_x3": 508.543, "r_y3": 141.57100000000003, "coord_origin": "TOPLEFT"}, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 56, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 510.447, "r_y0": 90.99699999999996, "r_x1": 523.707, "r_y1": 90.99699999999996, "r_x2": 523.707, "r_y2": 86.28599999999994, "r_x3": 510.447, "r_y3": 86.28599999999994, "coord_origin": "TOPLEFT"}, "text": "145K", "orig": "145K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 57, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 174.32299999999998, "r_x1": 86.585, "r_y1": 174.32299999999998, "r_x2": 86.585, "r_y2": 165.77099999999996, "r_x3": 50.112, "r_y3": 165.77099999999996, "coord_origin": "TOPLEFT"}, "text": "Figure 7:", "orig": "Figure 7:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 58, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 92.832, "r_y0": 174.32299999999998, "r_x1": 545.114, "r_y1": 174.32299999999998, "r_x2": 545.114, "r_y2": 165.77099999999996, "r_x3": 92.832, "r_y3": 165.77099999999996, "coord_origin": "TOPLEFT"}, "text": "Distribution of the tables across different dimensions per dataset. Simple vs complex tables per dataset and split,", "orig": "Distribution of the tables across different dimensions per dataset. Simple vs complex tables per dataset and split,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 59, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 186.27800000000002, "r_x1": 513.522, "r_y1": 186.27800000000002, "r_x2": 513.522, "r_y2": 177.726, "r_x3": 50.112, "r_y3": 177.726, "coord_origin": "TOPLEFT"}, "text": "strict vs non strict html structures per dataset and table complexity, missing bboxes per dataset and table complexity.", "orig": "strict vs non strict html structures per dataset and table complexity, missing bboxes per dataset and table complexity.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 60, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 61.569, "r_y0": 219.75199999999995, "r_x1": 65.056, "r_y1": 219.75199999999995, "r_x2": 65.056, "r_y2": 211.20000000000005, "r_x3": 61.569, "r_y3": 211.20000000000005, "coord_origin": "TOPLEFT"}, "text": "\u2022", "orig": "\u2022", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 61, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.037, "r_y0": 219.75199999999995, "r_x1": 286.365, "r_y1": 219.75199999999995, "r_x2": 286.365, "r_y2": 211.20000000000005, "r_x3": 70.037, "r_y3": 211.20000000000005, "coord_origin": "TOPLEFT"}, "text": "TableFormer output does not include the table cell con-", "orig": "TableFormer output does not include the table cell con-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 62, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.037, "r_y0": 231.707, "r_x1": 87.472, "r_y1": 231.707, "r_x2": 87.472, "r_y2": 223.15499999999997, "r_x3": 70.037, "r_y3": 223.15499999999997, "coord_origin": "TOPLEFT"}, "text": "tent.", "orig": "tent.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 63, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 61.569, "r_y0": 252.89200000000005, "r_x1": 65.056, "r_y1": 252.89200000000005, "r_x2": 65.056, "r_y2": 244.34000000000003, "r_x3": 61.569, "r_y3": 244.34000000000003, "coord_origin": "TOPLEFT"}, "text": "\u2022", "orig": "\u2022", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 64, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.037, "r_y0": 252.89200000000005, "r_x1": 286.365, "r_y1": 252.89200000000005, "r_x2": 286.365, "r_y2": 244.34000000000003, "r_x3": 70.037, "r_y3": 244.34000000000003, "coord_origin": "TOPLEFT"}, "text": "There are occasional inaccuracies in the predictions of", "orig": "There are occasional inaccuracies in the predictions of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 65, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.037, "r_y0": 264.847, "r_x1": 150.415, "r_y1": 264.847, "r_x2": 150.415, "r_y2": 256.29499999999996, "r_x3": 70.037, "r_y3": 256.29499999999996, "coord_origin": "TOPLEFT"}, "text": "the bounding boxes.", "orig": "the bounding boxes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 66, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 288.024, "r_x1": 286.365, "r_y1": 288.024, "r_x2": 286.365, "r_y2": 279.472, "r_x3": 62.067, "r_y3": 279.472, "coord_origin": "TOPLEFT"}, "text": "However, it is possible to mitigate those limitations by", "orig": "However, it is possible to mitigate those limitations by", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 67, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 299.979, "r_x1": 286.365, "r_y1": 299.979, "r_x2": 286.365, "r_y2": 291.427, "r_x3": 50.112, "r_y3": 291.427, "coord_origin": "TOPLEFT"}, "text": "combining the TableFormer predictions with the informa-", "orig": "combining the TableFormer predictions with the informa-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 68, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 311.934, "r_x1": 286.365, "r_y1": 311.934, "r_x2": 286.365, "r_y2": 303.382, "r_x3": 50.112, "r_y3": 303.382, "coord_origin": "TOPLEFT"}, "text": "tion already present inside a programmatic PDF document.", "orig": "tion already present inside a programmatic PDF document.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 69, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 323.889, "r_x1": 123.387, "r_y1": 323.889, "r_x2": 123.387, "r_y2": 315.337, "r_x3": 50.112, "r_y3": 315.337, "coord_origin": "TOPLEFT"}, "text": "More specifically,", "orig": "More specifically,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 70, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 128.348, "r_y0": 323.889, "r_x1": 286.365, "r_y1": 323.889, "r_x2": 286.365, "r_y2": 315.337, "r_x3": 128.348, "r_y3": 315.337, "coord_origin": "TOPLEFT"}, "text": "PDF documents can be seen as a se-", "orig": "PDF documents can be seen as a se-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 71, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 335.845, "r_x1": 286.365, "r_y1": 335.845, "r_x2": 286.365, "r_y2": 327.293, "r_x3": 50.112, "r_y3": 327.293, "coord_origin": "TOPLEFT"}, "text": "quence of PDF cells where each cell is described by its con-", "orig": "quence of PDF cells where each cell is described by its con-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 72, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 347.8, "r_x1": 286.365, "r_y1": 347.8, "r_x2": 286.365, "r_y2": 339.248, "r_x3": 50.112, "r_y3": 339.248, "coord_origin": "TOPLEFT"}, "text": "tent and bounding box. If we are able to associate the PDF", "orig": "tent and bounding box. If we are able to associate the PDF", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 73, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 359.755, "r_x1": 286.365, "r_y1": 359.755, "r_x2": 286.365, "r_y2": 351.203, "r_x3": 50.112, "r_y3": 351.203, "coord_origin": "TOPLEFT"}, "text": "cells with the predicted table cells, we can directly link the", "orig": "cells with the predicted table cells, we can directly link the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 74, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 371.71, "r_x1": 286.365, "r_y1": 371.71, "r_x2": 286.365, "r_y2": 363.158, "r_x3": 50.112, "r_y3": 363.158, "coord_origin": "TOPLEFT"}, "text": "PDF cell content to the table cell structure and use the PDF", "orig": "PDF cell content to the table cell structure and use the PDF", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 75, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 383.665, "r_x1": 286.365, "r_y1": 383.665, "r_x2": 286.365, "r_y2": 375.113, "r_x3": 50.112, "r_y3": 375.113, "coord_origin": "TOPLEFT"}, "text": "bounding boxes to correct misalignments in the predicted", "orig": "bounding boxes to correct misalignments in the predicted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 76, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 395.621, "r_x1": 154.56, "r_y1": 395.621, "r_x2": 154.56, "r_y2": 387.069, "r_x3": 50.112, "r_y3": 387.069, "coord_origin": "TOPLEFT"}, "text": "table cell bounding boxes.", "orig": "table cell bounding boxes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 77, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 407.89, "r_x1": 286.365, "r_y1": 407.89, "r_x2": 286.365, "r_y2": 399.338, "r_x3": 62.067, "r_y3": 399.338, "coord_origin": "TOPLEFT"}, "text": "Here is a step-by-step description of the prediction post-", "orig": "Here is a step-by-step description of the prediction post-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 78, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 419.846, "r_x1": 95.492, "r_y1": 419.846, "r_x2": 95.492, "r_y2": 411.294, "r_x3": 50.112, "r_y3": 411.294, "coord_origin": "TOPLEFT"}, "text": "processing:", "orig": "processing:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 79, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 432.116, "r_x1": 286.365, "r_y1": 432.116, "r_x2": 286.365, "r_y2": 423.564, "r_x3": 62.067, "r_y3": 423.564, "coord_origin": "TOPLEFT"}, "text": "1. Get the minimal grid dimensions - number of rows and", "orig": "1. Get the minimal grid dimensions - number of rows and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 80, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 444.071, "r_x1": 218.779, "r_y1": 444.071, "r_x2": 218.779, "r_y2": 435.519, "r_x3": 50.112, "r_y3": 435.519, "coord_origin": "TOPLEFT"}, "text": "columns for the predicted table structure.", "orig": "columns for the predicted table structure.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 81, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 224.796, "r_y0": 444.071, "r_x1": 286.365, "r_y1": 444.071, "r_x2": 286.365, "r_y2": 435.519, "r_x3": 224.796, "r_y3": 435.519, "coord_origin": "TOPLEFT"}, "text": "This represents", "orig": "This represents", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 82, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 456.026, "r_x1": 274.51, "r_y1": 456.026, "r_x2": 274.51, "r_y2": 447.474, "r_x3": 50.112, "r_y3": 447.474, "coord_origin": "TOPLEFT"}, "text": "the most granular grid for the underlying table structure.", "orig": "the most granular grid for the underlying table structure.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 83, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 468.296, "r_x1": 69.539, "r_y1": 468.296, "r_x2": 69.539, "r_y2": 459.744, "r_x3": 62.067, "r_y3": 459.744, "coord_origin": "TOPLEFT"}, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 84, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 77.429, "r_y0": 468.296, "r_x1": 286.365, "r_y1": 468.296, "r_x2": 286.365, "r_y2": 459.744, "r_x3": 77.429, "r_y3": 459.744, "coord_origin": "TOPLEFT"}, "text": "Generate pair-wise matches between the bounding", "orig": "Generate pair-wise matches between the bounding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 85, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 480.251, "r_x1": 286.365, "r_y1": 480.251, "r_x2": 286.365, "r_y2": 471.699, "r_x3": 50.112, "r_y3": 471.699, "coord_origin": "TOPLEFT"}, "text": "boxes of the PDF cells and the predicted cells. The Intersec-", "orig": "boxes of the PDF cells and the predicted cells. The Intersec-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 86, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 492.206, "r_x1": 286.365, "r_y1": 492.206, "r_x2": 286.365, "r_y2": 483.654, "r_x3": 50.112, "r_y3": 483.654, "coord_origin": "TOPLEFT"}, "text": "tion Over Union (IOU) metric is used to evaluate the quality", "orig": "tion Over Union (IOU) metric is used to evaluate the quality", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 87, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 504.161, "r_x1": 110.705, "r_y1": 504.161, "r_x2": 110.705, "r_y2": 495.609, "r_x3": 50.112, "r_y3": 495.609, "coord_origin": "TOPLEFT"}, "text": "of the matches.", "orig": "of the matches.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 88, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 516.431, "r_x1": 69.539, "r_y1": 516.431, "r_x2": 69.539, "r_y2": 507.879, "r_x3": 62.067, "r_y3": 507.879, "coord_origin": "TOPLEFT"}, "text": "3.", "orig": "3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 89, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 75.248, "r_y0": 516.431, "r_x1": 286.365, "r_y1": 516.431, "r_x2": 286.365, "r_y2": 507.879, "r_x3": 75.248, "r_y3": 507.879, "coord_origin": "TOPLEFT"}, "text": "Use a carefully selected IOU threshold to designate", "orig": "Use a carefully selected IOU threshold to designate", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 90, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 528.387, "r_x1": 226.071, "r_y1": 528.387, "r_x2": 226.071, "r_y2": 519.835, "r_x3": 50.112, "r_y3": 519.835, "coord_origin": "TOPLEFT"}, "text": "the matches as 'good' ones and 'bad' ones.", "orig": "the matches as 'good' ones and 'bad' ones.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 91, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 540.656, "r_x1": 76.453, "r_y1": 540.656, "r_x2": 76.453, "r_y2": 532.104, "r_x3": 62.067, "r_y3": 532.104, "coord_origin": "TOPLEFT"}, "text": "3.a.", "orig": "3.a.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 92, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 80.587, "r_y0": 540.656, "r_x1": 286.365, "r_y1": 540.656, "r_x2": 286.365, "r_y2": 532.104, "r_x3": 80.587, "r_y3": 532.104, "coord_origin": "TOPLEFT"}, "text": "If all IOU scores in a column are below the thresh-", "orig": "If all IOU scores in a column are below the thresh-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 93, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 552.612, "r_x1": 286.365, "r_y1": 552.612, "r_x2": 286.365, "r_y2": 544.06, "r_x3": 50.112, "r_y3": 544.06, "coord_origin": "TOPLEFT"}, "text": "old, discard all predictions (structure and bounding boxes)", "orig": "old, discard all predictions (structure and bounding boxes)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 94, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 564.567, "r_x1": 114.032, "r_y1": 564.567, "r_x2": 114.032, "r_y2": 556.015, "r_x3": 50.112, "r_y3": 556.015, "coord_origin": "TOPLEFT"}, "text": "for that column.", "orig": "for that column.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 95, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 576.837, "r_x1": 69.539, "r_y1": 576.837, "r_x2": 69.539, "r_y2": 568.285, "r_x3": 62.067, "r_y3": 568.285, "coord_origin": "TOPLEFT"}, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 96, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 76.732, "r_y0": 576.837, "r_x1": 286.365, "r_y1": 576.837, "r_x2": 286.365, "r_y2": 568.285, "r_x3": 76.732, "r_y3": 568.285, "coord_origin": "TOPLEFT"}, "text": "Find the best-fitting content alignment for the pre-", "orig": "Find the best-fitting content alignment for the pre-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 97, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 588.792, "r_x1": 286.365, "r_y1": 588.792, "r_x2": 286.365, "r_y2": 580.24, "r_x3": 50.112, "r_y3": 580.24, "coord_origin": "TOPLEFT"}, "text": "dicted cells with good IOU per each column. The alignment", "orig": "dicted cells with good IOU per each column. The alignment", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 98, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 600.7470000000001, "r_x1": 278.704, "r_y1": 600.7470000000001, "r_x2": 278.704, "r_y2": 592.1949999999999, "r_x3": 50.112, "r_y3": 592.1949999999999, "coord_origin": "TOPLEFT"}, "text": "of the column can be identified by the following formula:", "orig": "of the column can be identified by the following formula:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 99, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 112.028, "r_y0": 632.81, "r_x1": 157.952, "r_y1": 632.81, "r_x2": 157.952, "r_y2": 624.104, "r_x3": 112.028, "r_y3": 624.104, "coord_origin": "TOPLEFT"}, "text": "alignment", "orig": "alignment", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 100, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.715, "r_y0": 632.81, "r_x1": 203.496, "r_y1": 632.81, "r_x2": 203.496, "r_y2": 624.104, "r_x3": 160.715, "r_y3": 624.104, "coord_origin": "TOPLEFT"}, "text": "= arg min", "orig": "= arg min", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 101, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 185.585, "r_y0": 640.154, "r_x1": 189.145, "r_y1": 640.154, "r_x2": 189.145, "r_y2": 634.06, "r_x3": 185.585, "r_y3": 634.06, "coord_origin": "TOPLEFT"}, "text": "c", "orig": "c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 102, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 203.499, "r_y0": 632.668, "r_x1": 208.48, "r_y1": 632.668, "r_x2": 208.48, "r_y2": 624.104, "r_x3": 203.499, "r_y3": 624.104, "coord_origin": "TOPLEFT"}, "text": "{", "orig": "{", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 103, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 208.481, "r_y0": 632.81, "r_x1": 216.729, "r_y1": 632.81, "r_x2": 216.729, "r_y2": 624.104, "r_x3": 208.481, "r_y3": 624.104, "coord_origin": "TOPLEFT"}, "text": "D", "orig": "D", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 104, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 216.729, "r_y0": 633.734, "r_x1": 220.289, "r_y1": 633.734, "r_x2": 220.289, "r_y2": 627.64, "r_x3": 216.729, "r_y3": 627.64, "coord_origin": "TOPLEFT"}, "text": "c", "orig": "c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 105, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 220.787, "r_y0": 632.668, "r_x1": 225.768, "r_y1": 632.668, "r_x2": 225.768, "r_y2": 624.104, "r_x3": 220.787, "r_y3": 624.104, "coord_origin": "TOPLEFT"}, "text": "}", "orig": "}", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 106, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 110.705, "r_y0": 654.075, "r_x1": 118.953, "r_y1": 654.075, "r_x2": 118.953, "r_y2": 645.369, "r_x3": 110.705, "r_y3": 645.369, "coord_origin": "TOPLEFT"}, "text": "D", "orig": "D", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 107, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 118.953, "r_y0": 654.998, "r_x1": 122.513, "r_y1": 654.998, "r_x2": 122.513, "r_y2": 648.904, "r_x3": 118.953, "r_y3": 648.904, "coord_origin": "TOPLEFT"}, "text": "c", "orig": "c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 108, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 125.779, "r_y0": 654.075, "r_x1": 133.528, "r_y1": 654.075, "r_x2": 133.528, "r_y2": 645.369, "r_x3": 125.779, "r_y3": 645.369, "coord_origin": "TOPLEFT"}, "text": "=", "orig": "=", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 109, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 136.295, "r_y0": 654.075, "r_x1": 166.678, "r_y1": 654.075, "r_x2": 166.678, "r_y2": 645.369, "r_x3": 136.295, "r_y3": 645.369, "coord_origin": "TOPLEFT"}, "text": "max x", "orig": "max x", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 110, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 156.003, "r_y0": 653.933, "r_x1": 160.984, "r_y1": 653.933, "r_x2": 160.984, "r_y2": 645.369, "r_x3": 156.003, "r_y3": 645.369, "coord_origin": "TOPLEFT"}, "text": "{", "orig": "{", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 111, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 166.678, "r_y0": 654.998, "r_x1": 170.238, "r_y1": 654.998, "r_x2": 170.238, "r_y2": 648.904, "r_x3": 166.678, "r_y3": 648.904, "coord_origin": "TOPLEFT"}, "text": "c", "orig": "c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 112, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 170.736, "r_y0": 653.933, "r_x1": 185.678, "r_y1": 653.933, "r_x2": 185.678, "r_y2": 645.369, "r_x3": 170.736, "r_y3": 645.369, "coord_origin": "TOPLEFT"}, "text": "} -", "orig": "} -", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 113, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 187.894, "r_y0": 654.075, "r_x1": 216.729, "r_y1": 654.075, "r_x2": 216.729, "r_y2": 645.369, "r_x3": 187.894, "r_y3": 645.369, "coord_origin": "TOPLEFT"}, "text": "min x", "orig": "min x", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 114, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 206.054, "r_y0": 653.933, "r_x1": 211.035, "r_y1": 653.933, "r_x2": 211.035, "r_y2": 645.369, "r_x3": 206.054, "r_y3": 645.369, "coord_origin": "TOPLEFT"}, "text": "{", "orig": "{", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 115, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 216.729, "r_y0": 654.998, "r_x1": 220.289, "r_y1": 654.998, "r_x2": 220.289, "r_y2": 648.904, "r_x3": 216.729, "r_y3": 648.904, "coord_origin": "TOPLEFT"}, "text": "c", "orig": "c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 116, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 220.787, "r_y0": 653.933, "r_x1": 225.768, "r_y1": 653.933, "r_x2": 225.768, "r_y2": 645.369, "r_x3": 220.787, "r_y3": 645.369, "coord_origin": "TOPLEFT"}, "text": "}", "orig": "}", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 117, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 274.746, "r_y0": 643.706, "r_x1": 286.362, "r_y1": 643.706, "r_x2": 286.362, "r_y2": 635.154, "r_x3": 274.746, "r_y3": 635.154, "coord_origin": "TOPLEFT"}, "text": "(4)", "orig": "(4)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 118, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 676.886, "r_x1": 74.451, "r_y1": 676.886, "r_x2": 74.451, "r_y2": 668.3340000000001, "r_x3": 50.112, "r_y3": 668.3340000000001, "coord_origin": "TOPLEFT"}, "text": "where", "orig": "where", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 119, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 78.336, "r_y0": 676.722, "r_x1": 82.648, "r_y1": 676.722, "r_x2": 82.648, "r_y2": 668.016, "r_x3": 78.336, "r_y3": 668.016, "coord_origin": "TOPLEFT"}, "text": "c", "orig": "c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 120, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 86.533, "r_y0": 676.886, "r_x1": 93.178, "r_y1": 676.886, "r_x2": 93.178, "r_y2": 668.3340000000001, "r_x3": 86.533, "r_y3": 668.3340000000001, "coord_origin": "TOPLEFT"}, "text": "is", "orig": "is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 121, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 97.063, "r_y0": 676.886, "r_x1": 123.634, "r_y1": 676.886, "r_x2": 123.634, "r_y2": 668.3340000000001, "r_x3": 97.063, "r_y3": 668.3340000000001, "coord_origin": "TOPLEFT"}, "text": "one of", "orig": "one of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 122, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 127.519, "r_y0": 676.58, "r_x1": 132.5, "r_y1": 676.58, "r_x2": 132.5, "r_y2": 668.016, "r_x3": 127.519, "r_y3": 668.016, "coord_origin": "TOPLEFT"}, "text": "{", "orig": "{", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 123, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 132.501, "r_y0": 676.886, "r_x1": 148.272, "r_y1": 676.886, "r_x2": 148.272, "r_y2": 668.3340000000001, "r_x3": 132.501, "r_y3": 668.3340000000001, "coord_origin": "TOPLEFT"}, "text": "left,", "orig": "left,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 124, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 152.506, "r_y0": 676.886, "r_x1": 187.644, "r_y1": 676.886, "r_x2": 187.644, "r_y2": 668.3340000000001, "r_x3": 152.506, "r_y3": 668.3340000000001, "coord_origin": "TOPLEFT"}, "text": "centroid,", "orig": "centroid,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 125, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 191.878, "r_y0": 676.886, "r_x1": 210.697, "r_y1": 676.886, "r_x2": 210.697, "r_y2": 668.3340000000001, "r_x3": 191.878, "r_y3": 668.3340000000001, "coord_origin": "TOPLEFT"}, "text": "right", "orig": "right", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 126, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 210.697, "r_y0": 676.58, "r_x1": 215.678, "r_y1": 676.58, "r_x2": 215.678, "r_y2": 668.016, "r_x3": 210.697, "r_y3": 668.016, "coord_origin": "TOPLEFT"}, "text": "}", "orig": "}", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 127, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 219.563, "r_y0": 676.886, "r_x1": 233.949, "r_y1": 676.886, "r_x2": 233.949, "r_y2": 668.3340000000001, "r_x3": 219.563, "r_y3": 668.3340000000001, "coord_origin": "TOPLEFT"}, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 128, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 237.835, "r_y0": 676.722, "r_x1": 243.529, "r_y1": 676.722, "r_x2": 243.529, "r_y2": 668.016, "r_x3": 237.835, "r_y3": 668.016, "coord_origin": "TOPLEFT"}, "text": "x", "orig": "x", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 129, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 243.529, "r_y0": 677.645, "r_x1": 247.089, "r_y1": 677.645, "r_x2": 247.089, "r_y2": 671.551, "r_x3": 243.529, "r_y3": 671.551, "coord_origin": "TOPLEFT"}, "text": "c", "orig": "c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 130, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 251.473, "r_y0": 676.886, "r_x1": 258.118, "r_y1": 676.886, "r_x2": 258.118, "r_y2": 668.3340000000001, "r_x3": 251.473, "r_y3": 668.3340000000001, "coord_origin": "TOPLEFT"}, "text": "is", "orig": "is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 131, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 262.003, "r_y0": 676.886, "r_x1": 286.362, "r_y1": 676.886, "r_x2": 286.362, "r_y2": 668.3340000000001, "r_x3": 262.003, "r_y3": 668.3340000000001, "coord_origin": "TOPLEFT"}, "text": "the x-", "orig": "the x-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 132, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 688.841, "r_x1": 205.887, "r_y1": 688.841, "r_x2": 205.887, "r_y2": 680.289, "r_x3": 50.112, "r_y3": 680.289, "coord_origin": "TOPLEFT"}, "text": "coordinate for the corresponding point.", "orig": "coordinate for the corresponding point.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 133, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 701.111, "r_x1": 69.539, "r_y1": 701.111, "r_x2": 69.539, "r_y2": 692.559, "r_x3": 62.067, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "5.", "orig": "5.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 134, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 76.274, "r_y0": 701.111, "r_x1": 286.365, "r_y1": 701.111, "r_x2": 286.365, "r_y2": 692.559, "r_x3": 76.274, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "Use the alignment computed in step 4, to compute", "orig": "Use the alignment computed in step 4, to compute", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 135, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 713.066, "r_x1": 94.605, "r_y1": 713.066, "r_x2": 94.605, "r_y2": 704.514, "r_x3": 50.112, "r_y3": 704.514, "coord_origin": "TOPLEFT"}, "text": "the median", "orig": "the median", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 136, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 97.599, "r_y0": 712.902, "r_x1": 103.293, "r_y1": 712.902, "r_x2": 103.293, "r_y2": 704.196, "r_x3": 97.599, "r_y3": 704.196, "coord_origin": "TOPLEFT"}, "text": "x", "orig": "x", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 137, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 103.292, "r_y0": 713.066, "r_x1": 286.365, "r_y1": 713.066, "r_x2": 286.365, "r_y2": 704.514, "r_x3": 103.292, "r_y3": 704.514, "coord_origin": "TOPLEFT"}, "text": "-coordinate for all table columns and the me-", "orig": "-coordinate for all table columns and the me-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 138, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 219.75199999999995, "r_x1": 435.915, "r_y1": 219.75199999999995, "r_x2": 435.915, "r_y2": 211.20000000000005, "r_x3": 308.862, "r_y3": 211.20000000000005, "coord_origin": "TOPLEFT"}, "text": "dian cell size for all table cells.", "orig": "dian cell size for all table cells.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 139, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 440.697, "r_y0": 219.75199999999995, "r_x1": 545.115, "r_y1": 219.75199999999995, "r_x2": 545.115, "r_y2": 211.20000000000005, "r_x3": 440.697, "r_y3": 211.20000000000005, "coord_origin": "TOPLEFT"}, "text": "The usage of median dur-", "orig": "The usage of median dur-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 140, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 231.70799999999997, "r_x1": 545.115, "r_y1": 231.70799999999997, "r_x2": 545.115, "r_y2": 223.15599999999995, "r_x3": 308.862, "r_y3": 223.15599999999995, "coord_origin": "TOPLEFT"}, "text": "ing the computations, helps to eliminate outliers caused by", "orig": "ing the computations, helps to eliminate outliers caused by", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 141, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 243.663, "r_x1": 545.115, "r_y1": 243.663, "r_x2": 545.115, "r_y2": 235.111, "r_x3": 308.862, "r_y3": 235.111, "coord_origin": "TOPLEFT"}, "text": "occasional column spans which are usually wider than the", "orig": "occasional column spans which are usually wider than the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 142, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 255.61800000000005, "r_x1": 339.577, "r_y1": 255.61800000000005, "r_x2": 339.577, "r_y2": 247.06600000000003, "r_x3": 308.862, "r_y3": 247.06600000000003, "coord_origin": "TOPLEFT"}, "text": "normal.", "orig": "normal.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 143, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 267.923, "r_x1": 328.289, "r_y1": 267.923, "r_x2": 328.289, "r_y2": 259.371, "r_x3": 320.817, "r_y3": 259.371, "coord_origin": "TOPLEFT"}, "text": "6.", "orig": "6.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 144, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 334.884, "r_y0": 267.923, "r_x1": 545.115, "r_y1": 267.923, "r_x2": 545.115, "r_y2": 259.371, "r_x3": 334.884, "r_y3": 259.371, "coord_origin": "TOPLEFT"}, "text": "Snap all cells with bad IOU to their corresponding", "orig": "Snap all cells with bad IOU to their corresponding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 145, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 279.87800000000004, "r_x1": 338.192, "r_y1": 279.87800000000004, "r_x2": 338.192, "r_y2": 271.326, "r_x3": 308.862, "r_y3": 271.326, "coord_origin": "TOPLEFT"}, "text": "median", "orig": "median", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 146, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 340.682, "r_y0": 279.71400000000006, "r_x1": 346.376, "r_y1": 279.71400000000006, "r_x2": 346.376, "r_y2": 271.00800000000004, "r_x3": 340.682, "r_y3": 271.00800000000004, "coord_origin": "TOPLEFT"}, "text": "x", "orig": "x", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 147, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 346.376, "r_y0": 279.87800000000004, "r_x1": 453.723, "r_y1": 279.87800000000004, "r_x2": 453.723, "r_y2": 271.326, "r_x3": 346.376, "r_y3": 271.326, "coord_origin": "TOPLEFT"}, "text": "-coordinates and cell sizes.", "orig": "-coordinates and cell sizes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 148, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 292.184, "r_x1": 328.289, "r_y1": 292.184, "r_x2": 328.289, "r_y2": 283.632, "r_x3": 320.817, "r_y3": 283.632, "coord_origin": "TOPLEFT"}, "text": "7.", "orig": "7.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 149, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 332.144, "r_y0": 292.184, "r_x1": 545.115, "r_y1": 292.184, "r_x2": 545.115, "r_y2": 283.632, "r_x3": 332.144, "r_y3": 283.632, "coord_origin": "TOPLEFT"}, "text": "Generate a new set of pair-wise matches between the", "orig": "Generate a new set of pair-wise matches between the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 150, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 304.139, "r_x1": 476.562, "r_y1": 304.139, "r_x2": 476.562, "r_y2": 295.587, "r_x3": 308.862, "r_y3": 295.587, "coord_origin": "TOPLEFT"}, "text": "corrected bounding boxes and PDF cells.", "orig": "corrected bounding boxes and PDF cells.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 151, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 482.082, "r_y0": 304.139, "r_x1": 545.115, "r_y1": 304.139, "r_x2": 545.115, "r_y2": 295.587, "r_x3": 482.082, "r_y3": 295.587, "coord_origin": "TOPLEFT"}, "text": "This time use a", "orig": "This time use a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 152, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 316.094, "r_x1": 545.115, "r_y1": 316.094, "r_x2": 545.115, "r_y2": 307.542, "r_x3": 308.862, "r_y3": 307.542, "coord_origin": "TOPLEFT"}, "text": "modified version of the IOU metric, where the area of the", "orig": "modified version of the IOU metric, where the area of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 153, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 328.049, "r_x1": 545.115, "r_y1": 328.049, "r_x2": 545.115, "r_y2": 319.497, "r_x3": 308.862, "r_y3": 319.497, "coord_origin": "TOPLEFT"}, "text": "intersection between the predicted and PDF cells is divided", "orig": "intersection between the predicted and PDF cells is divided", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 154, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 340.005, "r_x1": 397.19, "r_y1": 340.005, "r_x2": 397.19, "r_y2": 331.453, "r_x3": 308.862, "r_y3": 331.453, "coord_origin": "TOPLEFT"}, "text": "by the PDF cell area.", "orig": "by the PDF cell area.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 155, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 403.656, "r_y0": 340.005, "r_x1": 545.115, "r_y1": 340.005, "r_x2": 545.115, "r_y2": 331.453, "r_x3": 403.656, "r_y3": 331.453, "coord_origin": "TOPLEFT"}, "text": "In case there are multiple matches", "orig": "In case there are multiple matches", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 156, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 351.96, "r_x1": 545.115, "r_y1": 351.96, "r_x2": 545.115, "r_y2": 343.408, "r_x3": 308.862, "r_y3": 343.408, "coord_origin": "TOPLEFT"}, "text": "for the same PDF cell, the prediction with the higher score", "orig": "for the same PDF cell, the prediction with the higher score", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 157, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 363.915, "r_x1": 357.26, "r_y1": 363.915, "r_x2": 357.26, "r_y2": 355.363, "r_x3": 308.862, "r_y3": 355.363, "coord_origin": "TOPLEFT"}, "text": "is preferred.", "orig": "is preferred.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 158, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 361.176, "r_y0": 363.915, "r_x1": 545.115, "r_y1": 363.915, "r_x2": 545.115, "r_y2": 355.363, "r_x3": 361.176, "r_y3": 355.363, "coord_origin": "TOPLEFT"}, "text": "This covers the cases where the PDF cells are", "orig": "This covers the cases where the PDF cells are", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 159, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 375.87, "r_x1": 545.115, "r_y1": 375.87, "r_x2": 545.115, "r_y2": 367.318, "r_x3": 308.862, "r_y3": 367.318, "coord_origin": "TOPLEFT"}, "text": "smaller than the area of predicted or corrected prediction", "orig": "smaller than the area of predicted or corrected prediction", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 160, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 387.825, "r_x1": 329.614, "r_y1": 387.825, "r_x2": 329.614, "r_y2": 379.273, "r_x3": 308.862, "r_y3": 379.273, "coord_origin": "TOPLEFT"}, "text": "cells.", "orig": "cells.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 161, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 400.131, "r_x1": 328.289, "r_y1": 400.131, "r_x2": 328.289, "r_y2": 391.579, "r_x3": 320.817, "r_y3": 391.579, "coord_origin": "TOPLEFT"}, "text": "8.", "orig": "8.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 162, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 333.569, "r_y0": 400.131, "r_x1": 545.115, "r_y1": 400.131, "r_x2": 545.115, "r_y2": 391.579, "r_x3": 333.569, "r_y3": 391.579, "coord_origin": "TOPLEFT"}, "text": "In some rare occasions, we have noticed that Table-", "orig": "In some rare occasions, we have noticed that Table-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 163, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 412.086, "r_x1": 545.115, "r_y1": 412.086, "r_x2": 545.115, "r_y2": 403.534, "r_x3": 308.862, "r_y3": 403.534, "coord_origin": "TOPLEFT"}, "text": "Former can confuse a single column as two. When the post-", "orig": "Former can confuse a single column as two. When the post-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 164, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 424.041, "r_x1": 545.115, "r_y1": 424.041, "r_x2": 545.115, "r_y2": 415.489, "r_x3": 308.862, "r_y3": 415.489, "coord_origin": "TOPLEFT"}, "text": "processing steps are applied, this results with two predicted", "orig": "processing steps are applied, this results with two predicted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 165, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 435.996, "r_x1": 488.109, "r_y1": 435.996, "r_x2": 488.109, "r_y2": 427.444, "r_x3": 308.862, "r_y3": 427.444, "coord_origin": "TOPLEFT"}, "text": "columns pointing to the same PDF column.", "orig": "columns pointing to the same PDF column.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 166, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 494.336, "r_y0": 435.996, "r_x1": 545.115, "r_y1": 435.996, "r_x2": 545.115, "r_y2": 427.444, "r_x3": 494.336, "r_y3": 427.444, "coord_origin": "TOPLEFT"}, "text": "In such case", "orig": "In such case", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 167, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 447.951, "r_x1": 545.115, "r_y1": 447.951, "r_x2": 545.115, "r_y2": 439.399, "r_x3": 308.862, "r_y3": 439.399, "coord_origin": "TOPLEFT"}, "text": "we must de-duplicate the columns according to highest to-", "orig": "we must de-duplicate the columns according to highest to-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 168, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 459.906, "r_x1": 426.182, "r_y1": 459.906, "r_x2": 426.182, "r_y2": 451.354, "r_x3": 308.862, "r_y3": 451.354, "coord_origin": "TOPLEFT"}, "text": "tal column intersection score.", "orig": "tal column intersection score.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 169, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 472.212, "r_x1": 328.289, "r_y1": 472.212, "r_x2": 328.289, "r_y2": 463.66, "r_x3": 320.817, "r_y3": 463.66, "coord_origin": "TOPLEFT"}, "text": "9.", "orig": "9.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 170, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 333.629, "r_y0": 472.212, "r_x1": 478.505, "r_y1": 472.212, "r_x2": 478.505, "r_y2": 463.66, "r_x3": 333.629, "r_y3": 463.66, "coord_origin": "TOPLEFT"}, "text": "Pick up the remaining orphan cells.", "orig": "Pick up the remaining orphan cells.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 171, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 483.855, "r_y0": 472.212, "r_x1": 545.115, "r_y1": 472.212, "r_x2": 545.115, "r_y2": 463.66, "r_x3": 483.855, "r_y3": 463.66, "coord_origin": "TOPLEFT"}, "text": "There could be", "orig": "There could be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 172, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 484.167, "r_x1": 545.115, "r_y1": 484.167, "r_x2": 545.115, "r_y2": 475.615, "r_x3": 308.862, "r_y3": 475.615, "coord_origin": "TOPLEFT"}, "text": "cases, when after applying all the previous post-processing", "orig": "cases, when after applying all the previous post-processing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 173, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 496.122, "r_x1": 545.115, "r_y1": 496.122, "r_x2": 545.115, "r_y2": 487.57, "r_x3": 308.862, "r_y3": 487.57, "coord_origin": "TOPLEFT"}, "text": "steps, some PDF cells could still remain without any match", "orig": "steps, some PDF cells could still remain without any match", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 174, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 508.077, "r_x1": 381.898, "r_y1": 508.077, "r_x2": 381.898, "r_y2": 499.525, "r_x3": 308.862, "r_y3": 499.525, "coord_origin": "TOPLEFT"}, "text": "to predicted cells.", "orig": "to predicted cells.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 175, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 388.702, "r_y0": 508.077, "r_x1": 545.115, "r_y1": 508.077, "r_x2": 545.115, "r_y2": 499.525, "r_x3": 388.702, "r_y3": 499.525, "coord_origin": "TOPLEFT"}, "text": "However, it is still possible to deduce", "orig": "However, it is still possible to deduce", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 176, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 520.033, "r_x1": 545.115, "r_y1": 520.033, "r_x2": 545.115, "r_y2": 511.481, "r_x3": 308.862, "r_y3": 511.481, "coord_origin": "TOPLEFT"}, "text": "the correct matching for an orphan PDF cell by mapping its", "orig": "the correct matching for an orphan PDF cell by mapping its", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 177, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 531.988, "r_x1": 483.576, "r_y1": 531.988, "r_x2": 483.576, "r_y2": 523.4359999999999, "r_x3": 308.862, "r_y3": 523.4359999999999, "coord_origin": "TOPLEFT"}, "text": "bounding box on the geometry of the grid.", "orig": "bounding box on the geometry of the grid.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 178, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 489.195, "r_y0": 531.988, "r_x1": 545.115, "r_y1": 531.988, "r_x2": 545.115, "r_y2": 523.4359999999999, "r_x3": 489.195, "r_y3": 523.4359999999999, "coord_origin": "TOPLEFT"}, "text": "This mapping", "orig": "This mapping", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 179, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 543.943, "r_x1": 545.115, "r_y1": 543.943, "r_x2": 545.115, "r_y2": 535.3910000000001, "r_x3": 308.862, "r_y3": 535.3910000000001, "coord_origin": "TOPLEFT"}, "text": "decides if the content of the orphan cell will be appended to", "orig": "decides if the content of the orphan cell will be appended to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 180, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 555.898, "r_x1": 545.115, "r_y1": 555.898, "r_x2": 545.115, "r_y2": 547.346, "r_x3": 308.862, "r_y3": 547.346, "coord_origin": "TOPLEFT"}, "text": "an already matched table cell, or a new table cell should be", "orig": "an already matched table cell, or a new table cell should be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 181, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 567.8530000000001, "r_x1": 442.221, "r_y1": 567.8530000000001, "r_x2": 442.221, "r_y2": 559.3009999999999, "r_x3": 308.862, "r_y3": 559.3009999999999, "coord_origin": "TOPLEFT"}, "text": "created to match with the orphan.", "orig": "created to match with the orphan.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 182, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 580.159, "r_x1": 332.712, "r_y1": 580.159, "r_x2": 332.712, "r_y2": 571.607, "r_x3": 320.817, "r_y3": 571.607, "coord_origin": "TOPLEFT"}, "text": "9a.", "orig": "9a.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 183, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 337.943, "r_y0": 580.159, "r_x1": 545.115, "r_y1": 580.159, "r_x2": 545.115, "r_y2": 571.607, "r_x3": 337.943, "r_y3": 571.607, "coord_origin": "TOPLEFT"}, "text": "Compute the top and bottom boundary of the hori-", "orig": "Compute the top and bottom boundary of the hori-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 184, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 592.114, "r_x1": 471.641, "r_y1": 592.114, "r_x2": 471.641, "r_y2": 583.562, "r_x3": 308.862, "r_y3": 583.562, "coord_origin": "TOPLEFT"}, "text": "zontal band for each grid row (min/max", "orig": "zontal band for each grid row (min/max", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 185, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 474.834, "r_y0": 591.95, "r_x1": 479.719, "r_y1": 591.95, "r_x2": 479.719, "r_y2": 583.244, "r_x3": 474.834, "r_y3": 583.244, "coord_origin": "TOPLEFT"}, "text": "y", "orig": "y", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 186, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 483.269, "r_y0": 592.114, "r_x1": 545.117, "r_y1": 592.114, "r_x2": 545.117, "r_y2": 583.562, "r_x3": 483.269, "r_y3": 583.562, "coord_origin": "TOPLEFT"}, "text": "coordinates per", "orig": "coordinates per", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 187, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 604.069, "r_x1": 329.913, "r_y1": 604.069, "r_x2": 329.913, "r_y2": 595.517, "r_x3": 308.862, "r_y3": 595.517, "coord_origin": "TOPLEFT"}, "text": "row).", "orig": "row).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 188, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 616.374, "r_x1": 332.872, "r_y1": 616.374, "r_x2": 332.872, "r_y2": 607.822, "r_x3": 320.817, "r_y3": 607.822, "coord_origin": "TOPLEFT"}, "text": "9b.", "orig": "9b.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 189, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 339.925, "r_y0": 616.374, "r_x1": 374.226, "r_y1": 616.374, "r_x2": 374.226, "r_y2": 607.822, "r_x3": 339.925, "r_y3": 607.822, "coord_origin": "TOPLEFT"}, "text": "Intersect", "orig": "Intersect", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 190, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 378.042, "r_y0": 616.374, "r_x1": 545.115, "r_y1": 616.374, "r_x2": 545.115, "r_y2": 607.822, "r_x3": 378.042, "r_y3": 607.822, "coord_origin": "TOPLEFT"}, "text": "the orphan's bounding box with the row", "orig": "the orphan's bounding box with the row", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 191, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 628.33, "r_x1": 495.292, "r_y1": 628.33, "r_x2": 495.292, "r_y2": 619.778, "r_x3": 308.862, "r_y3": 619.778, "coord_origin": "TOPLEFT"}, "text": "bands, and map the cell to the closest grid row.", "orig": "bands, and map the cell to the closest grid row.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 192, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 640.635, "r_x1": 332.712, "r_y1": 640.635, "r_x2": 332.712, "r_y2": 632.083, "r_x3": 320.817, "r_y3": 632.083, "coord_origin": "TOPLEFT"}, "text": "9c.", "orig": "9c.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 193, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 337.534, "r_y0": 640.635, "r_x1": 545.115, "r_y1": 640.635, "r_x2": 545.115, "r_y2": 632.083, "r_x3": 337.534, "r_y3": 632.083, "coord_origin": "TOPLEFT"}, "text": "Compute the left and right boundary of the vertical", "orig": "Compute the left and right boundary of the vertical", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 194, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 652.59, "r_x1": 455.282, "r_y1": 652.59, "r_x2": 455.282, "r_y2": 644.038, "r_x3": 308.862, "r_y3": 644.038, "coord_origin": "TOPLEFT"}, "text": "band for each grid column (min/max", "orig": "band for each grid column (min/max", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 195, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 457.777, "r_y0": 652.4259999999999, "r_x1": 463.471, "r_y1": 652.4259999999999, "r_x2": 463.471, "r_y2": 643.72, "r_x3": 457.777, "r_y3": 643.72, "coord_origin": "TOPLEFT"}, "text": "x", "orig": "x", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 196, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 465.971, "r_y0": 652.59, "r_x1": 545.114, "r_y1": 652.59, "r_x2": 545.114, "r_y2": 644.038, "r_x3": 465.971, "r_y3": 644.038, "coord_origin": "TOPLEFT"}, "text": "coordinates per col-", "orig": "coordinates per col-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 197, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 664.545, "r_x1": 332.384, "r_y1": 664.545, "r_x2": 332.384, "r_y2": 655.9929999999999, "r_x3": 308.862, "r_y3": 655.9929999999999, "coord_origin": "TOPLEFT"}, "text": "umn).", "orig": "umn).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 198, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 676.851, "r_x1": 545.115, "r_y1": 676.851, "r_x2": 545.115, "r_y2": 668.299, "r_x3": 320.817, "r_y3": 668.299, "coord_origin": "TOPLEFT"}, "text": "9d. Intersect the orphan's bounding box with the column", "orig": "9d. Intersect the orphan's bounding box with the column", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 199, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 688.806, "r_x1": 510.585, "r_y1": 688.806, "r_x2": 510.585, "r_y2": 680.254, "r_x3": 308.862, "r_y3": 680.254, "coord_origin": "TOPLEFT"}, "text": "bands, and map the cell to the closest grid column.", "orig": "bands, and map the cell to the closest grid column.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 200, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 701.111, "r_x1": 545.115, "r_y1": 701.111, "r_x2": 545.115, "r_y2": 692.559, "r_x3": 320.817, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "9e. If the table cell under the identified row and column", "orig": "9e. If the table cell under the identified row and column", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 201, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 713.066, "r_x1": 545.115, "r_y1": 713.066, "r_x2": 545.115, "r_y2": 704.514, "r_x3": 308.862, "r_y3": 704.514, "coord_origin": "TOPLEFT"}, "text": "is not empty, extend its content with the content of the or-", "orig": "is not empty, extend its content with the content of the or-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 202, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 292.631, "r_y0": 742.954, "r_x1": 302.594, "r_y1": 742.954, "r_x2": 302.594, "r_y2": 734.402, "r_x3": 292.631, "r_y3": 734.402, "coord_origin": "TOPLEFT"}, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "parsed_page": null, "predictions": {"layout": {"clusters": [{"id": 30, "label": "picture", "bbox": {"l": 53.54227066040039, "t": 74.74854278564453, "r": 544.938232421875, "b": 147.59091186523438, "coord_origin": "TOPLEFT"}, "confidence": 0.6033818125724792, "cells": [{"index": 0, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 119.391, "r_y0": 83.19600000000003, "r_x1": 151.946, "r_y1": 83.19600000000003, "r_x2": 151.946, "r_y2": 77.543, "r_x3": 119.391, "r_y3": 77.543, "coord_origin": "TOPLEFT"}, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 53.346, "r_y0": 81.077, "r_x1": 59.327, "r_y1": 81.077, "r_x2": 59.327, "r_y2": 75.42399999999998, "r_x3": 53.346, "r_y3": 75.42399999999998, "coord_origin": "TOPLEFT"}, "text": "b.", "orig": "b.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 289.579, "r_y0": 83.34400000000005, "r_x1": 319.827, "r_y1": 83.34400000000005, "r_x2": 319.827, "r_y2": 77.69100000000003, "r_x3": 289.579, "r_y3": 77.69100000000003, "coord_origin": "TOPLEFT"}, "text": "FinTabNet", "orig": "FinTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 448.373, "r_y0": 83.13999999999999, "r_x1": 481.759, "r_y1": 83.13999999999999, "r_x2": 481.759, "r_y2": 77.48699999999997, "r_x3": 448.373, "r_y3": 77.48699999999997, "coord_origin": "TOPLEFT"}, "text": "Table Bank", "orig": "Table Bank", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 82.553, "r_y0": 146.18100000000004, "r_x1": 105.08, "r_y1": 146.18100000000004, "r_x2": 105.08, "r_y2": 141.47000000000003, "r_x3": 82.553, "r_y3": 141.47000000000003, "coord_origin": "TOPLEFT"}, "text": "Train Val", "orig": "Train Val", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 63.039, "r_y0": 106.00900000000001, "r_x1": 85.29, "r_y1": 106.00900000000001, "r_x2": 85.29, "r_y2": 101.298, "r_x3": 63.039, "r_y3": 101.298, "coord_origin": "TOPLEFT"}, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 67.768, "r_y0": 129.29999999999995, "r_x1": 85.231, "r_y1": 129.29999999999995, "r_x2": 85.231, "r_y2": 124.58900000000006, "r_x3": 67.768, "r_y3": 124.58900000000006, "coord_origin": "TOPLEFT"}, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 227.551, "r_y0": 107.44500000000005, "r_x1": 249.803, "r_y1": 107.44500000000005, "r_x2": 249.803, "r_y2": 102.73400000000004, "r_x3": 227.551, "r_y3": 102.73400000000004, "coord_origin": "TOPLEFT"}, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 232.199, "r_y0": 131.89099999999996, "r_x1": 249.662, "r_y1": 131.89099999999996, "r_x2": 249.662, "r_y2": 127.17999999999995, "r_x3": 232.199, "r_y3": 127.17999999999995, "coord_origin": "TOPLEFT"}, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 396.234, "r_y0": 118.95000000000005, "r_x1": 413.697, "r_y1": 118.95000000000005, "r_x2": 413.697, "r_y2": 114.23900000000003, "r_x3": 396.234, "r_y3": 114.23900000000003, "coord_origin": "TOPLEFT"}, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 60.938, "r_y0": 90.63800000000003, "r_x1": 76.151, "r_y1": 90.63800000000003, "r_x2": 76.151, "r_y2": 85.92700000000002, "r_x3": 60.938, "r_y3": 85.92700000000002, "coord_origin": "TOPLEFT"}, "text": "100%", "orig": "100%", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 82.305, "r_y0": 91.12800000000004, "r_x1": 106.992, "r_y1": 91.10699999999997, "r_x2": 106.992, "r_y2": 86.39599999999996, "r_x3": 82.305, "r_y3": 86.41700000000003, "coord_origin": "TOPLEFT"}, "text": "500K 10K", "orig": "500K 10K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 246.205, "r_y0": 146.51099999999997, "r_x1": 271.386, "r_y1": 146.51099999999997, "r_x2": 271.386, "r_y2": 141.79999999999995, "r_x3": 246.205, "r_y3": 141.79999999999995, "coord_origin": "TOPLEFT"}, "text": "Train Test", "orig": "Train Test", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 274.182, "r_y0": 146.51099999999997, "r_x1": 281.88, "r_y1": 146.51099999999997, "r_x2": 281.88, "r_y2": 141.79999999999995, "r_x3": 274.182, "r_y3": 141.79999999999995, "coord_origin": "TOPLEFT"}, "text": "Val", "orig": "Val", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 226.698, "r_y0": 90.63800000000003, "r_x1": 241.912, "r_y1": 90.63800000000003, "r_x2": 241.912, "r_y2": 85.92700000000002, "r_x3": 226.698, "r_y3": 85.92700000000002, "coord_origin": "TOPLEFT"}, "text": "100%", "orig": "100%", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 249.939, "r_y0": 90.99300000000005, "r_x1": 282.494, "r_y1": 91.0, "r_x2": 282.494, "r_y2": 86.28899999999999, "r_x3": 249.939, "r_y3": 86.28200000000004, "coord_origin": "TOPLEFT"}, "text": "91K 10K10K", "orig": "91K 10K10K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 410.194, "r_y0": 146.18100000000004, "r_x1": 434.278, "r_y1": 146.32799999999997, "r_x2": 434.278, "r_y2": 141.61699999999996, "r_x3": 410.194, "r_y3": 141.47000000000003, "coord_origin": "TOPLEFT"}, "text": "Train Test", "orig": "Train Test", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 436.991, "r_y0": 146.32799999999997, "r_x1": 444.689, "r_y1": 146.32799999999997, "r_x2": 444.689, "r_y2": 141.61699999999996, "r_x3": 436.991, "r_y3": 141.61699999999996, "coord_origin": "TOPLEFT"}, "text": "Val", "orig": "Val", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 391.373, "r_y0": 90.63800000000003, "r_x1": 406.587, "r_y1": 90.63800000000003, "r_x2": 406.587, "r_y2": 85.92700000000002, "r_x3": 391.373, "r_y3": 85.92700000000002, "coord_origin": "TOPLEFT"}, "text": "100%", "orig": "100%", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 19, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 410.521, "r_y0": 91.12800000000004, "r_x1": 445.624, "r_y1": 91.16600000000005, "r_x2": 445.624, "r_y2": 86.45500000000004, "r_x3": 410.521, "r_y3": 86.41700000000003, "coord_origin": "TOPLEFT"}, "text": "130K 5K 10K", "orig": "130K 5K 10K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 20, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 113.949, "r_y0": 146.19299999999998, "r_x1": 156.042, "r_y1": 146.341, "r_x2": 156.042, "r_y2": 141.63, "r_x3": 113.949, "r_y3": 141.48199999999997, "coord_origin": "TOPLEFT"}, "text": "Complex Simple", "orig": "Complex Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 21, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 116.916, "r_y0": 99.72299999999996, "r_x1": 127.054, "r_y1": 99.72299999999996, "r_x2": 127.054, "r_y2": 95.01199999999994, "r_x3": 116.916, "r_y3": 95.01199999999994, "coord_origin": "TOPLEFT"}, "text": "Non", "orig": "Non", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 22, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 113.315, "r_y0": 105.84299999999996, "r_x1": 127.053, "r_y1": 105.84299999999996, "r_x2": 127.053, "r_y2": 101.13199999999995, "r_x3": 113.315, "r_y3": 101.13199999999995, "coord_origin": "TOPLEFT"}, "text": "Strict", "orig": "Strict", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 23, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 112.941, "r_y0": 111.96299999999997, "r_x1": 127.055, "r_y1": 111.96299999999997, "r_x2": 127.055, "r_y2": 107.25199999999995, "r_x3": 112.941, "r_y3": 107.25199999999995, "coord_origin": "TOPLEFT"}, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 24, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 113.227, "r_y0": 127.51999999999998, "r_x1": 126.966, "r_y1": 127.51999999999998, "r_x2": 126.966, "r_y2": 122.80899999999997, "r_x3": 113.227, "r_y3": 122.80899999999997, "coord_origin": "TOPLEFT"}, "text": "Strict", "orig": "Strict", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 25, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 112.854, "r_y0": 133.64, "r_x1": 126.968, "r_y1": 133.64, "r_x2": 126.968, "r_y2": 128.92899999999997, "r_x3": 112.854, "r_y3": 128.92899999999997, "coord_origin": "TOPLEFT"}, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 26, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 122.031, "r_y0": 91.17600000000004, "r_x1": 151.042, "r_y1": 91.17100000000005, "r_x2": 151.042, "r_y2": 86.46000000000004, "r_x3": 122.031, "r_y3": 86.46500000000003, "coord_origin": "TOPLEFT"}, "text": "230K 280K", "orig": "230K 280K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 27, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 311.654, "r_y0": 91.46000000000004, "r_x1": 321.672, "r_y1": 91.46000000000004, "r_x2": 321.672, "r_y2": 86.74900000000002, "r_x3": 311.654, "r_y3": 86.74900000000002, "coord_origin": "TOPLEFT"}, "text": "65K", "orig": "65K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 28, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 287.894, "r_y0": 146.615, "r_x1": 328.809, "r_y1": 146.615, "r_x2": 328.809, "r_y2": 141.904, "r_x3": 287.894, "r_y3": 141.904, "coord_origin": "TOPLEFT"}, "text": "Complex Simple", "orig": "Complex Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 29, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 289.236, "r_y0": 97.98500000000001, "r_x1": 299.375, "r_y1": 97.98500000000001, "r_x2": 299.375, "r_y2": 93.274, "r_x3": 289.236, "r_y3": 93.274, "coord_origin": "TOPLEFT"}, "text": "Non", "orig": "Non", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 30, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 285.635, "r_y0": 104.10500000000002, "r_x1": 299.373, "r_y1": 104.10500000000002, "r_x2": 299.373, "r_y2": 99.394, "r_x3": 285.635, "r_y3": 99.394, "coord_origin": "TOPLEFT"}, "text": "Strict", "orig": "Strict", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 285.261, "r_y0": 110.22500000000002, "r_x1": 299.375, "r_y1": 110.22500000000002, "r_x2": 299.375, "r_y2": 105.51400000000001, "r_x3": 285.261, "r_y3": 105.51400000000001, "coord_origin": "TOPLEFT"}, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 285.431, "r_y0": 125.29499999999996, "r_x1": 299.169, "r_y1": 125.29499999999996, "r_x2": 299.169, "r_y2": 120.58399999999995, "r_x3": 285.431, "r_y3": 120.58399999999995, "coord_origin": "TOPLEFT"}, "text": "Strict", "orig": "Strict", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 285.057, "r_y0": 131.41499999999996, "r_x1": 299.171, "r_y1": 131.41499999999996, "r_x2": 299.171, "r_y2": 126.70399999999995, "r_x3": 285.057, "r_y3": 126.70399999999995, "coord_origin": "TOPLEFT"}, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 299.584, "r_y0": 91.59799999999996, "r_x1": 309.602, "r_y1": 91.59799999999996, "r_x2": 309.602, "r_y2": 86.88699999999994, "r_x3": 299.584, "r_y3": 86.88699999999994, "coord_origin": "TOPLEFT"}, "text": "47K", "orig": "47K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 466.041, "r_y0": 146.57600000000002, "r_x1": 483.504, "r_y1": 146.57600000000002, "r_x2": 483.504, "r_y2": 141.86599999999999, "r_x3": 466.041, "r_y3": 141.86599999999999, "coord_origin": "TOPLEFT"}, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 459.022, "r_y0": 98.66600000000005, "r_x1": 469.16, "r_y1": 98.66600000000005, "r_x2": 469.16, "r_y2": 93.95500000000004, "r_x3": 459.022, "r_y3": 93.95500000000004, "coord_origin": "TOPLEFT"}, "text": "Non", "orig": "Non", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 455.421, "r_y0": 104.78599999999994, "r_x1": 469.159, "r_y1": 104.78599999999994, "r_x2": 469.159, "r_y2": 100.07500000000005, "r_x3": 455.421, "r_y3": 100.07500000000005, "coord_origin": "TOPLEFT"}, "text": "Strict", "orig": "Strict", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 455.047, "r_y0": 110.90599999999995, "r_x1": 469.161, "r_y1": 110.90599999999995, "r_x2": 469.161, "r_y2": 106.19500000000005, "r_x3": 455.047, "r_y3": 106.19500000000005, "coord_origin": "TOPLEFT"}, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 467.394, "r_y0": 90.47699999999998, "r_x1": 480.655, "r_y1": 90.47699999999998, "r_x2": 480.655, "r_y2": 85.76599999999996, "r_x3": 467.394, "r_y3": 85.76599999999996, "coord_origin": "TOPLEFT"}, "text": "145K", "orig": "145K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.377, "r_y0": 146.48900000000003, "r_x1": 202.841, "r_y1": 146.61599999999999, "r_x2": 202.841, "r_y2": 141.90499999999997, "r_x3": 160.377, "r_y3": 141.77800000000002, "coord_origin": "TOPLEFT"}, "text": "Complex Simple", "orig": "Complex Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 153.743, "r_y0": 99.76999999999998, "r_x1": 173.327, "r_y1": 99.76999999999998, "r_x2": 173.327, "r_y2": 95.05899999999997, "r_x3": 153.743, "r_y3": 95.05899999999997, "coord_origin": "TOPLEFT"}, "text": "Contain", "orig": "Contain", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 154.51, "r_y0": 105.88999999999999, "r_x1": 173.325, "r_y1": 105.88999999999999, "r_x2": 173.325, "r_y2": 101.17899999999997, "r_x3": 154.51, "r_y3": 101.17899999999997, "coord_origin": "TOPLEFT"}, "text": "Missing", "orig": "Missing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 155.272, "r_y0": 112.00999999999999, "r_x1": 173.327, "r_y1": 112.00999999999999, "r_x2": 173.327, "r_y2": 107.29899999999998, "r_x3": 155.272, "r_y3": 107.29899999999998, "coord_origin": "TOPLEFT"}, "text": "bboxes", "orig": "bboxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 326.413, "r_y0": 112.13699999999994, "r_x1": 345.997, "r_y1": 112.13699999999994, "r_x2": 345.997, "r_y2": 107.42600000000004, "r_x3": 326.413, "r_y3": 107.42600000000004, "coord_origin": "TOPLEFT"}, "text": "Contain", "orig": "Contain", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 327.18, "r_y0": 118.25699999999995, "r_x1": 345.995, "r_y1": 118.25699999999995, "r_x2": 345.995, "r_y2": 113.54600000000005, "r_x3": 327.18, "r_y3": 113.54600000000005, "coord_origin": "TOPLEFT"}, "text": "Missing", "orig": "Missing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 327.941, "r_y0": 124.37699999999995, "r_x1": 345.996, "r_y1": 124.37699999999995, "r_x2": 345.996, "r_y2": 119.66600000000005, "r_x3": 327.941, "r_y3": 119.66600000000005, "coord_origin": "TOPLEFT"}, "text": "bboxes", "orig": "bboxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 488.994, "r_y0": 109.05899999999997, "r_x1": 508.764, "r_y1": 109.05899999999997, "r_x2": 508.764, "r_y2": 104.34799999999996, "r_x3": 488.994, "r_y3": 104.34799999999996, "coord_origin": "TOPLEFT"}, "text": "Dataset", "orig": "Dataset", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 48, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 490.189, "r_y0": 115.17899999999997, "r_x1": 508.764, "r_y1": 115.17899999999997, "r_x2": 508.764, "r_y2": 110.46799999999996, "r_x3": 490.189, "r_y3": 110.46799999999996, "coord_origin": "TOPLEFT"}, "text": "doesn't", "orig": "doesn't", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 49, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 489.72, "r_y0": 121.29899999999998, "r_x1": 508.768, "r_y1": 121.29899999999998, "r_x2": 508.768, "r_y2": 116.58799999999997, "r_x3": 489.72, "r_y3": 116.58799999999997, "coord_origin": "TOPLEFT"}, "text": "provide", "orig": "provide", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 50, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 490.711, "r_y0": 127.41899999999998, "r_x1": 508.766, "r_y1": 127.41899999999998, "r_x2": 508.766, "r_y2": 122.70799999999997, "r_x3": 490.711, "r_y3": 122.70799999999997, "coord_origin": "TOPLEFT"}, "text": "bboxes", "orig": "bboxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 51, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 168.504, "r_y0": 91.04100000000005, "r_x1": 197.527, "r_y1": 91.0, "r_x2": 197.527, "r_y2": 86.28899999999999, "r_x3": 168.504, "r_y3": 86.33000000000004, "coord_origin": "TOPLEFT"}, "text": "230K 280K", "orig": "230K 280K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 52, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 357.377, "r_y0": 90.90200000000004, "r_x1": 367.395, "r_y1": 90.90200000000004, "r_x2": 367.395, "r_y2": 86.19100000000003, "r_x3": 357.377, "r_y3": 86.19100000000003, "coord_origin": "TOPLEFT"}, "text": "65K", "orig": "65K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 53, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 333.732, "r_y0": 146.52800000000002, "r_x1": 374.929, "r_y1": 146.52800000000002, "r_x2": 374.929, "r_y2": 141.817, "r_x3": 333.732, "r_y3": 141.817, "coord_origin": "TOPLEFT"}, "text": "Complex Simple", "orig": "Complex Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 54, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 345.691, "r_y0": 90.96100000000001, "r_x1": 355.709, "r_y1": 90.96100000000001, "r_x2": 355.709, "r_y2": 86.25, "r_x3": 345.691, "r_y3": 86.25, "coord_origin": "TOPLEFT"}, "text": "47K", "orig": "47K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 55, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 508.543, "r_y0": 146.28200000000004, "r_x1": 526.006, "r_y1": 146.28200000000004, "r_x2": 526.006, "r_y2": 141.57100000000003, "r_x3": 508.543, "r_y3": 141.57100000000003, "coord_origin": "TOPLEFT"}, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 56, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 510.447, "r_y0": 90.99699999999996, "r_x1": 523.707, "r_y1": 90.99699999999996, "r_x2": 523.707, "r_y2": 86.28599999999994, "r_x3": 510.447, "r_y3": 86.28599999999994, "coord_origin": "TOPLEFT"}, "text": "145K", "orig": "145K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": [{"id": 46, "label": "text", "bbox": {"l": 119.391, "t": 77.543, "r": 151.946, "b": 83.19600000000003, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 0, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 119.391, "r_y0": 83.19600000000003, "r_x1": 151.946, "r_y1": 83.19600000000003, "r_x2": 151.946, "r_y2": 77.543, "r_x3": 119.391, "r_y3": 77.543, "coord_origin": "TOPLEFT"}, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 47, "label": "text", "bbox": {"l": 53.346, "t": 75.42399999999998, "r": 59.327, "b": 81.077, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 53.346, "r_y0": 81.077, "r_x1": 59.327, "r_y1": 81.077, "r_x2": 59.327, "r_y2": 75.42399999999998, "r_x3": 53.346, "r_y3": 75.42399999999998, "coord_origin": "TOPLEFT"}, "text": "b.", "orig": "b.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 48, "label": "text", "bbox": {"l": 289.579, "t": 77.69100000000003, "r": 319.827, "b": 83.34400000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 289.579, "r_y0": 83.34400000000005, "r_x1": 319.827, "r_y1": 83.34400000000005, "r_x2": 319.827, "r_y2": 77.69100000000003, "r_x3": 289.579, "r_y3": 77.69100000000003, "coord_origin": "TOPLEFT"}, "text": "FinTabNet", "orig": "FinTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 49, "label": "text", "bbox": {"l": 448.373, "t": 77.48699999999997, "r": 481.759, "b": 83.13999999999999, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 448.373, "r_y0": 83.13999999999999, "r_x1": 481.759, "r_y1": 83.13999999999999, "r_x2": 481.759, "r_y2": 77.48699999999997, "r_x3": 448.373, "r_y3": 77.48699999999997, "coord_origin": "TOPLEFT"}, "text": "Table Bank", "orig": "Table Bank", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 50, "label": "text", "bbox": {"l": 82.553, "t": 141.47000000000003, "r": 105.08, "b": 146.18100000000004, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 82.553, "r_y0": 146.18100000000004, "r_x1": 105.08, "r_y1": 146.18100000000004, "r_x2": 105.08, "r_y2": 141.47000000000003, "r_x3": 82.553, "r_y3": 141.47000000000003, "coord_origin": "TOPLEFT"}, "text": "Train Val", "orig": "Train Val", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 51, "label": "text", "bbox": {"l": 63.039, "t": 101.298, "r": 85.29, "b": 106.00900000000001, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 63.039, "r_y0": 106.00900000000001, "r_x1": 85.29, "r_y1": 106.00900000000001, "r_x2": 85.29, "r_y2": 101.298, "r_x3": 63.039, "r_y3": 101.298, "coord_origin": "TOPLEFT"}, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 52, "label": "text", "bbox": {"l": 67.768, "t": 124.58900000000006, "r": 85.231, "b": 129.29999999999995, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 67.768, "r_y0": 129.29999999999995, "r_x1": 85.231, "r_y1": 129.29999999999995, "r_x2": 85.231, "r_y2": 124.58900000000006, "r_x3": 67.768, "r_y3": 124.58900000000006, "coord_origin": "TOPLEFT"}, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 53, "label": "text", "bbox": {"l": 227.551, "t": 102.73400000000004, "r": 249.803, "b": 107.44500000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 227.551, "r_y0": 107.44500000000005, "r_x1": 249.803, "r_y1": 107.44500000000005, "r_x2": 249.803, "r_y2": 102.73400000000004, "r_x3": 227.551, "r_y3": 102.73400000000004, "coord_origin": "TOPLEFT"}, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 54, "label": "text", "bbox": {"l": 232.199, "t": 127.17999999999995, "r": 249.662, "b": 131.89099999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 232.199, "r_y0": 131.89099999999996, "r_x1": 249.662, "r_y1": 131.89099999999996, "r_x2": 249.662, "r_y2": 127.17999999999995, "r_x3": 232.199, "r_y3": 127.17999999999995, "coord_origin": "TOPLEFT"}, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 55, "label": "text", "bbox": {"l": 396.234, "t": 114.23900000000003, "r": 413.697, "b": 118.95000000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 396.234, "r_y0": 118.95000000000005, "r_x1": 413.697, "r_y1": 118.95000000000005, "r_x2": 413.697, "r_y2": 114.23900000000003, "r_x3": 396.234, "r_y3": 114.23900000000003, "coord_origin": "TOPLEFT"}, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 56, "label": "text", "bbox": {"l": 60.938, "t": 85.92700000000002, "r": 76.151, "b": 90.63800000000003, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 60.938, "r_y0": 90.63800000000003, "r_x1": 76.151, "r_y1": 90.63800000000003, "r_x2": 76.151, "r_y2": 85.92700000000002, "r_x3": 60.938, "r_y3": 85.92700000000002, "coord_origin": "TOPLEFT"}, "text": "100%", "orig": "100%", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 57, "label": "text", "bbox": {"l": 82.305, "t": 86.39599999999996, "r": 106.992, "b": 91.12800000000004, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 82.305, "r_y0": 91.12800000000004, "r_x1": 106.992, "r_y1": 91.10699999999997, "r_x2": 106.992, "r_y2": 86.39599999999996, "r_x3": 82.305, "r_y3": 86.41700000000003, "coord_origin": "TOPLEFT"}, "text": "500K 10K", "orig": "500K 10K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 58, "label": "text", "bbox": {"l": 246.205, "t": 141.79999999999995, "r": 271.386, "b": 146.51099999999997, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 246.205, "r_y0": 146.51099999999997, "r_x1": 271.386, "r_y1": 146.51099999999997, "r_x2": 271.386, "r_y2": 141.79999999999995, "r_x3": 246.205, "r_y3": 141.79999999999995, "coord_origin": "TOPLEFT"}, "text": "Train Test", "orig": "Train Test", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 59, "label": "text", "bbox": {"l": 274.182, "t": 141.79999999999995, "r": 281.88, "b": 146.51099999999997, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 274.182, "r_y0": 146.51099999999997, "r_x1": 281.88, "r_y1": 146.51099999999997, "r_x2": 281.88, "r_y2": 141.79999999999995, "r_x3": 274.182, "r_y3": 141.79999999999995, "coord_origin": "TOPLEFT"}, "text": "Val", "orig": "Val", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 60, "label": "text", "bbox": {"l": 226.698, "t": 85.92700000000002, "r": 241.912, "b": 90.63800000000003, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 226.698, "r_y0": 90.63800000000003, "r_x1": 241.912, "r_y1": 90.63800000000003, "r_x2": 241.912, "r_y2": 85.92700000000002, "r_x3": 226.698, "r_y3": 85.92700000000002, "coord_origin": "TOPLEFT"}, "text": "100%", "orig": "100%", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 61, "label": "text", "bbox": {"l": 249.939, "t": 86.28200000000004, "r": 282.494, "b": 91.0, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 249.939, "r_y0": 90.99300000000005, "r_x1": 282.494, "r_y1": 91.0, "r_x2": 282.494, "r_y2": 86.28899999999999, "r_x3": 249.939, "r_y3": 86.28200000000004, "coord_origin": "TOPLEFT"}, "text": "91K 10K10K", "orig": "91K 10K10K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 62, "label": "text", "bbox": {"l": 410.194, "t": 141.47000000000003, "r": 434.278, "b": 146.32799999999997, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 410.194, "r_y0": 146.18100000000004, "r_x1": 434.278, "r_y1": 146.32799999999997, "r_x2": 434.278, "r_y2": 141.61699999999996, "r_x3": 410.194, "r_y3": 141.47000000000003, "coord_origin": "TOPLEFT"}, "text": "Train Test", "orig": "Train Test", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 63, "label": "text", "bbox": {"l": 436.991, "t": 141.61699999999996, "r": 444.689, "b": 146.32799999999997, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 436.991, "r_y0": 146.32799999999997, "r_x1": 444.689, "r_y1": 146.32799999999997, "r_x2": 444.689, "r_y2": 141.61699999999996, "r_x3": 436.991, "r_y3": 141.61699999999996, "coord_origin": "TOPLEFT"}, "text": "Val", "orig": "Val", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 64, "label": "text", "bbox": {"l": 391.373, "t": 85.92700000000002, "r": 406.587, "b": 90.63800000000003, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 391.373, "r_y0": 90.63800000000003, "r_x1": 406.587, "r_y1": 90.63800000000003, "r_x2": 406.587, "r_y2": 85.92700000000002, "r_x3": 391.373, "r_y3": 85.92700000000002, "coord_origin": "TOPLEFT"}, "text": "100%", "orig": "100%", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 65, "label": "text", "bbox": {"l": 410.521, "t": 86.41700000000003, "r": 445.624, "b": 91.16600000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 19, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 410.521, "r_y0": 91.12800000000004, "r_x1": 445.624, "r_y1": 91.16600000000005, "r_x2": 445.624, "r_y2": 86.45500000000004, "r_x3": 410.521, "r_y3": 86.41700000000003, "coord_origin": "TOPLEFT"}, "text": "130K 5K 10K", "orig": "130K 5K 10K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 66, "label": "text", "bbox": {"l": 113.949, "t": 141.48199999999997, "r": 156.042, "b": 146.341, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 20, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 113.949, "r_y0": 146.19299999999998, "r_x1": 156.042, "r_y1": 146.341, "r_x2": 156.042, "r_y2": 141.63, "r_x3": 113.949, "r_y3": 141.48199999999997, "coord_origin": "TOPLEFT"}, "text": "Complex Simple", "orig": "Complex Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 67, "label": "text", "bbox": {"l": 116.916, "t": 95.01199999999994, "r": 127.054, "b": 99.72299999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 21, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 116.916, "r_y0": 99.72299999999996, "r_x1": 127.054, "r_y1": 99.72299999999996, "r_x2": 127.054, "r_y2": 95.01199999999994, "r_x3": 116.916, "r_y3": 95.01199999999994, "coord_origin": "TOPLEFT"}, "text": "Non", "orig": "Non", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 68, "label": "text", "bbox": {"l": 113.315, "t": 101.13199999999995, "r": 127.053, "b": 105.84299999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 22, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 113.315, "r_y0": 105.84299999999996, "r_x1": 127.053, "r_y1": 105.84299999999996, "r_x2": 127.053, "r_y2": 101.13199999999995, "r_x3": 113.315, "r_y3": 101.13199999999995, "coord_origin": "TOPLEFT"}, "text": "Strict", "orig": "Strict", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 69, "label": "text", "bbox": {"l": 112.941, "t": 107.25199999999995, "r": 127.055, "b": 111.96299999999997, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 23, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 112.941, "r_y0": 111.96299999999997, "r_x1": 127.055, "r_y1": 111.96299999999997, "r_x2": 127.055, "r_y2": 107.25199999999995, "r_x3": 112.941, "r_y3": 107.25199999999995, "coord_origin": "TOPLEFT"}, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 70, "label": "text", "bbox": {"l": 113.227, "t": 122.80899999999997, "r": 126.966, "b": 127.51999999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 24, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 113.227, "r_y0": 127.51999999999998, "r_x1": 126.966, "r_y1": 127.51999999999998, "r_x2": 126.966, "r_y2": 122.80899999999997, "r_x3": 113.227, "r_y3": 122.80899999999997, "coord_origin": "TOPLEFT"}, "text": "Strict", "orig": "Strict", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 71, "label": "text", "bbox": {"l": 112.854, "t": 128.92899999999997, "r": 126.968, "b": 133.64, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 25, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 112.854, "r_y0": 133.64, "r_x1": 126.968, "r_y1": 133.64, "r_x2": 126.968, "r_y2": 128.92899999999997, "r_x3": 112.854, "r_y3": 128.92899999999997, "coord_origin": "TOPLEFT"}, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 72, "label": "text", "bbox": {"l": 122.031, "t": 86.46000000000004, "r": 151.042, "b": 91.17600000000004, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 26, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 122.031, "r_y0": 91.17600000000004, "r_x1": 151.042, "r_y1": 91.17100000000005, "r_x2": 151.042, "r_y2": 86.46000000000004, "r_x3": 122.031, "r_y3": 86.46500000000003, "coord_origin": "TOPLEFT"}, "text": "230K 280K", "orig": "230K 280K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 73, "label": "text", "bbox": {"l": 311.654, "t": 86.74900000000002, "r": 321.672, "b": 91.46000000000004, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 27, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 311.654, "r_y0": 91.46000000000004, "r_x1": 321.672, "r_y1": 91.46000000000004, "r_x2": 321.672, "r_y2": 86.74900000000002, "r_x3": 311.654, "r_y3": 86.74900000000002, "coord_origin": "TOPLEFT"}, "text": "65K", "orig": "65K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 74, "label": "text", "bbox": {"l": 287.894, "t": 141.904, "r": 328.809, "b": 146.615, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 28, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 287.894, "r_y0": 146.615, "r_x1": 328.809, "r_y1": 146.615, "r_x2": 328.809, "r_y2": 141.904, "r_x3": 287.894, "r_y3": 141.904, "coord_origin": "TOPLEFT"}, "text": "Complex Simple", "orig": "Complex Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 75, "label": "text", "bbox": {"l": 289.236, "t": 93.274, "r": 299.375, "b": 97.98500000000001, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 29, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 289.236, "r_y0": 97.98500000000001, "r_x1": 299.375, "r_y1": 97.98500000000001, "r_x2": 299.375, "r_y2": 93.274, "r_x3": 289.236, "r_y3": 93.274, "coord_origin": "TOPLEFT"}, "text": "Non", "orig": "Non", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 76, "label": "text", "bbox": {"l": 285.635, "t": 99.394, "r": 299.373, "b": 104.10500000000002, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 30, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 285.635, "r_y0": 104.10500000000002, "r_x1": 299.373, "r_y1": 104.10500000000002, "r_x2": 299.373, "r_y2": 99.394, "r_x3": 285.635, "r_y3": 99.394, "coord_origin": "TOPLEFT"}, "text": "Strict", "orig": "Strict", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 77, "label": "text", "bbox": {"l": 285.261, "t": 105.51400000000001, "r": 299.375, "b": 110.22500000000002, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 285.261, "r_y0": 110.22500000000002, "r_x1": 299.375, "r_y1": 110.22500000000002, "r_x2": 299.375, "r_y2": 105.51400000000001, "r_x3": 285.261, "r_y3": 105.51400000000001, "coord_origin": "TOPLEFT"}, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 78, "label": "text", "bbox": {"l": 285.431, "t": 120.58399999999995, "r": 299.169, "b": 125.29499999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 285.431, "r_y0": 125.29499999999996, "r_x1": 299.169, "r_y1": 125.29499999999996, "r_x2": 299.169, "r_y2": 120.58399999999995, "r_x3": 285.431, "r_y3": 120.58399999999995, "coord_origin": "TOPLEFT"}, "text": "Strict", "orig": "Strict", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 79, "label": "text", "bbox": {"l": 285.057, "t": 126.70399999999995, "r": 299.171, "b": 131.41499999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 285.057, "r_y0": 131.41499999999996, "r_x1": 299.171, "r_y1": 131.41499999999996, "r_x2": 299.171, "r_y2": 126.70399999999995, "r_x3": 285.057, "r_y3": 126.70399999999995, "coord_origin": "TOPLEFT"}, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 80, "label": "text", "bbox": {"l": 299.584, "t": 86.88699999999994, "r": 309.602, "b": 91.59799999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 299.584, "r_y0": 91.59799999999996, "r_x1": 309.602, "r_y1": 91.59799999999996, "r_x2": 309.602, "r_y2": 86.88699999999994, "r_x3": 299.584, "r_y3": 86.88699999999994, "coord_origin": "TOPLEFT"}, "text": "47K", "orig": "47K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 81, "label": "text", "bbox": {"l": 466.041, "t": 141.86599999999999, "r": 483.504, "b": 146.57600000000002, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 466.041, "r_y0": 146.57600000000002, "r_x1": 483.504, "r_y1": 146.57600000000002, "r_x2": 483.504, "r_y2": 141.86599999999999, "r_x3": 466.041, "r_y3": 141.86599999999999, "coord_origin": "TOPLEFT"}, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 82, "label": "text", "bbox": {"l": 459.022, "t": 93.95500000000004, "r": 469.16, "b": 98.66600000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 459.022, "r_y0": 98.66600000000005, "r_x1": 469.16, "r_y1": 98.66600000000005, "r_x2": 469.16, "r_y2": 93.95500000000004, "r_x3": 459.022, "r_y3": 93.95500000000004, "coord_origin": "TOPLEFT"}, "text": "Non", "orig": "Non", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 83, "label": "text", "bbox": {"l": 455.421, "t": 100.07500000000005, "r": 469.159, "b": 104.78599999999994, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 455.421, "r_y0": 104.78599999999994, "r_x1": 469.159, "r_y1": 104.78599999999994, "r_x2": 469.159, "r_y2": 100.07500000000005, "r_x3": 455.421, "r_y3": 100.07500000000005, "coord_origin": "TOPLEFT"}, "text": "Strict", "orig": "Strict", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 84, "label": "text", "bbox": {"l": 455.047, "t": 106.19500000000005, "r": 469.161, "b": 110.90599999999995, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 455.047, "r_y0": 110.90599999999995, "r_x1": 469.161, "r_y1": 110.90599999999995, "r_x2": 469.161, "r_y2": 106.19500000000005, "r_x3": 455.047, "r_y3": 106.19500000000005, "coord_origin": "TOPLEFT"}, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 85, "label": "text", "bbox": {"l": 467.394, "t": 85.76599999999996, "r": 480.655, "b": 90.47699999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 467.394, "r_y0": 90.47699999999998, "r_x1": 480.655, "r_y1": 90.47699999999998, "r_x2": 480.655, "r_y2": 85.76599999999996, "r_x3": 467.394, "r_y3": 85.76599999999996, "coord_origin": "TOPLEFT"}, "text": "145K", "orig": "145K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 86, "label": "text", "bbox": {"l": 160.377, "t": 141.77800000000002, "r": 202.841, "b": 146.61599999999999, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.377, "r_y0": 146.48900000000003, "r_x1": 202.841, "r_y1": 146.61599999999999, "r_x2": 202.841, "r_y2": 141.90499999999997, "r_x3": 160.377, "r_y3": 141.77800000000002, "coord_origin": "TOPLEFT"}, "text": "Complex Simple", "orig": "Complex Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 87, "label": "text", "bbox": {"l": 153.743, "t": 95.05899999999997, "r": 173.327, "b": 99.76999999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 153.743, "r_y0": 99.76999999999998, "r_x1": 173.327, "r_y1": 99.76999999999998, "r_x2": 173.327, "r_y2": 95.05899999999997, "r_x3": 153.743, "r_y3": 95.05899999999997, "coord_origin": "TOPLEFT"}, "text": "Contain", "orig": "Contain", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 88, "label": "text", "bbox": {"l": 154.51, "t": 101.17899999999997, "r": 173.325, "b": 105.88999999999999, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 154.51, "r_y0": 105.88999999999999, "r_x1": 173.325, "r_y1": 105.88999999999999, "r_x2": 173.325, "r_y2": 101.17899999999997, "r_x3": 154.51, "r_y3": 101.17899999999997, "coord_origin": "TOPLEFT"}, "text": "Missing", "orig": "Missing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 89, "label": "text", "bbox": {"l": 155.272, "t": 107.29899999999998, "r": 173.327, "b": 112.00999999999999, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 155.272, "r_y0": 112.00999999999999, "r_x1": 173.327, "r_y1": 112.00999999999999, "r_x2": 173.327, "r_y2": 107.29899999999998, "r_x3": 155.272, "r_y3": 107.29899999999998, "coord_origin": "TOPLEFT"}, "text": "bboxes", "orig": "bboxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 90, "label": "text", "bbox": {"l": 326.413, "t": 107.42600000000004, "r": 345.997, "b": 112.13699999999994, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 326.413, "r_y0": 112.13699999999994, "r_x1": 345.997, "r_y1": 112.13699999999994, "r_x2": 345.997, "r_y2": 107.42600000000004, "r_x3": 326.413, "r_y3": 107.42600000000004, "coord_origin": "TOPLEFT"}, "text": "Contain", "orig": "Contain", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 91, "label": "text", "bbox": {"l": 327.18, "t": 113.54600000000005, "r": 345.995, "b": 118.25699999999995, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 327.18, "r_y0": 118.25699999999995, "r_x1": 345.995, "r_y1": 118.25699999999995, "r_x2": 345.995, "r_y2": 113.54600000000005, "r_x3": 327.18, "r_y3": 113.54600000000005, "coord_origin": "TOPLEFT"}, "text": "Missing", "orig": "Missing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 92, "label": "text", "bbox": {"l": 327.941, "t": 119.66600000000005, "r": 345.996, "b": 124.37699999999995, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 327.941, "r_y0": 124.37699999999995, "r_x1": 345.996, "r_y1": 124.37699999999995, "r_x2": 345.996, "r_y2": 119.66600000000005, "r_x3": 327.941, "r_y3": 119.66600000000005, "coord_origin": "TOPLEFT"}, "text": "bboxes", "orig": "bboxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 93, "label": "text", "bbox": {"l": 488.994, "t": 104.34799999999996, "r": 508.764, "b": 109.05899999999997, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 488.994, "r_y0": 109.05899999999997, "r_x1": 508.764, "r_y1": 109.05899999999997, "r_x2": 508.764, "r_y2": 104.34799999999996, "r_x3": 488.994, "r_y3": 104.34799999999996, "coord_origin": "TOPLEFT"}, "text": "Dataset", "orig": "Dataset", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 94, "label": "text", "bbox": {"l": 490.189, "t": 110.46799999999996, "r": 508.764, "b": 115.17899999999997, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 48, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 490.189, "r_y0": 115.17899999999997, "r_x1": 508.764, "r_y1": 115.17899999999997, "r_x2": 508.764, "r_y2": 110.46799999999996, "r_x3": 490.189, "r_y3": 110.46799999999996, "coord_origin": "TOPLEFT"}, "text": "doesn't", "orig": "doesn't", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 95, "label": "text", "bbox": {"l": 489.72, "t": 116.58799999999997, "r": 508.768, "b": 121.29899999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 49, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 489.72, "r_y0": 121.29899999999998, "r_x1": 508.768, "r_y1": 121.29899999999998, "r_x2": 508.768, "r_y2": 116.58799999999997, "r_x3": 489.72, "r_y3": 116.58799999999997, "coord_origin": "TOPLEFT"}, "text": "provide", "orig": "provide", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 96, "label": "text", "bbox": {"l": 490.711, "t": 122.70799999999997, "r": 508.766, "b": 127.41899999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 50, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 490.711, "r_y0": 127.41899999999998, "r_x1": 508.766, "r_y1": 127.41899999999998, "r_x2": 508.766, "r_y2": 122.70799999999997, "r_x3": 490.711, "r_y3": 122.70799999999997, "coord_origin": "TOPLEFT"}, "text": "bboxes", "orig": "bboxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 97, "label": "text", "bbox": {"l": 168.504, "t": 86.28899999999999, "r": 197.527, "b": 91.04100000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 51, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 168.504, "r_y0": 91.04100000000005, "r_x1": 197.527, "r_y1": 91.0, "r_x2": 197.527, "r_y2": 86.28899999999999, "r_x3": 168.504, "r_y3": 86.33000000000004, "coord_origin": "TOPLEFT"}, "text": "230K 280K", "orig": "230K 280K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 98, "label": "text", "bbox": {"l": 357.377, "t": 86.19100000000003, "r": 367.395, "b": 90.90200000000004, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 52, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 357.377, "r_y0": 90.90200000000004, "r_x1": 367.395, "r_y1": 90.90200000000004, "r_x2": 367.395, "r_y2": 86.19100000000003, "r_x3": 357.377, "r_y3": 86.19100000000003, "coord_origin": "TOPLEFT"}, "text": "65K", "orig": "65K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 99, "label": "text", "bbox": {"l": 333.732, "t": 141.817, "r": 374.929, "b": 146.52800000000002, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 53, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 333.732, "r_y0": 146.52800000000002, "r_x1": 374.929, "r_y1": 146.52800000000002, "r_x2": 374.929, "r_y2": 141.817, "r_x3": 333.732, "r_y3": 141.817, "coord_origin": "TOPLEFT"}, "text": "Complex Simple", "orig": "Complex Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 100, "label": "text", "bbox": {"l": 345.691, "t": 86.25, "r": 355.709, "b": 90.96100000000001, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 54, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 345.691, "r_y0": 90.96100000000001, "r_x1": 355.709, "r_y1": 90.96100000000001, "r_x2": 355.709, "r_y2": 86.25, "r_x3": 345.691, "r_y3": 86.25, "coord_origin": "TOPLEFT"}, "text": "47K", "orig": "47K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 101, "label": "text", "bbox": {"l": 508.543, "t": 141.57100000000003, "r": 526.006, "b": 146.28200000000004, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 55, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 508.543, "r_y0": 146.28200000000004, "r_x1": 526.006, "r_y1": 146.28200000000004, "r_x2": 526.006, "r_y2": 141.57100000000003, "r_x3": 508.543, "r_y3": 141.57100000000003, "coord_origin": "TOPLEFT"}, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 102, "label": "text", "bbox": {"l": 510.447, "t": 86.28599999999994, "r": 523.707, "b": 90.99699999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 56, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 510.447, "r_y0": 90.99699999999996, "r_x1": 523.707, "r_y1": 90.99699999999996, "r_x2": 523.707, "r_y2": 86.28599999999994, "r_x3": 510.447, "r_y3": 86.28599999999994, "coord_origin": "TOPLEFT"}, "text": "145K", "orig": "145K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}]}, {"id": 1, "label": "caption", "bbox": {"l": 50.112, "t": 165.77099999999996, "r": 545.114, "b": 186.27800000000002, "coord_origin": "TOPLEFT"}, "confidence": 0.9661495685577393, "cells": [{"index": 57, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 174.32299999999998, "r_x1": 86.585, "r_y1": 174.32299999999998, "r_x2": 86.585, "r_y2": 165.77099999999996, "r_x3": 50.112, "r_y3": 165.77099999999996, "coord_origin": "TOPLEFT"}, "text": "Figure 7:", "orig": "Figure 7:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 58, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 92.832, "r_y0": 174.32299999999998, "r_x1": 545.114, "r_y1": 174.32299999999998, "r_x2": 545.114, "r_y2": 165.77099999999996, "r_x3": 92.832, "r_y3": 165.77099999999996, "coord_origin": "TOPLEFT"}, "text": "Distribution of the tables across different dimensions per dataset. Simple vs complex tables per dataset and split,", "orig": "Distribution of the tables across different dimensions per dataset. Simple vs complex tables per dataset and split,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 59, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 186.27800000000002, "r_x1": 513.522, "r_y1": 186.27800000000002, "r_x2": 513.522, "r_y2": 177.726, "r_x3": 50.112, "r_y3": 177.726, "coord_origin": "TOPLEFT"}, "text": "strict vs non strict html structures per dataset and table complexity, missing bboxes per dataset and table complexity.", "orig": "strict vs non strict html structures per dataset and table complexity, missing bboxes per dataset and table complexity.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 4, "label": "list_item", "bbox": {"l": 61.569, "t": 211.20000000000005, "r": 286.365, "b": 231.707, "coord_origin": "TOPLEFT"}, "confidence": 0.9621952772140503, "cells": [{"index": 60, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 61.569, "r_y0": 219.75199999999995, "r_x1": 65.056, "r_y1": 219.75199999999995, "r_x2": 65.056, "r_y2": 211.20000000000005, "r_x3": 61.569, "r_y3": 211.20000000000005, "coord_origin": "TOPLEFT"}, "text": "\u2022", "orig": "\u2022", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 61, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.037, "r_y0": 219.75199999999995, "r_x1": 286.365, "r_y1": 219.75199999999995, "r_x2": 286.365, "r_y2": 211.20000000000005, "r_x3": 70.037, "r_y3": 211.20000000000005, "coord_origin": "TOPLEFT"}, "text": "TableFormer output does not include the table cell con-", "orig": "TableFormer output does not include the table cell con-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 62, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.037, "r_y0": 231.707, "r_x1": 87.472, "r_y1": 231.707, "r_x2": 87.472, "r_y2": 223.15499999999997, "r_x3": 70.037, "r_y3": 223.15499999999997, "coord_origin": "TOPLEFT"}, "text": "tent.", "orig": "tent.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 3, "label": "list_item", "bbox": {"l": 61.569, "t": 244.34000000000003, "r": 286.365, "b": 264.847, "coord_origin": "TOPLEFT"}, "confidence": 0.9629555344581604, "cells": [{"index": 63, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 61.569, "r_y0": 252.89200000000005, "r_x1": 65.056, "r_y1": 252.89200000000005, "r_x2": 65.056, "r_y2": 244.34000000000003, "r_x3": 61.569, "r_y3": 244.34000000000003, "coord_origin": "TOPLEFT"}, "text": "\u2022", "orig": "\u2022", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 64, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.037, "r_y0": 252.89200000000005, "r_x1": 286.365, "r_y1": 252.89200000000005, "r_x2": 286.365, "r_y2": 244.34000000000003, "r_x3": 70.037, "r_y3": 244.34000000000003, "coord_origin": "TOPLEFT"}, "text": "There are occasional inaccuracies in the predictions of", "orig": "There are occasional inaccuracies in the predictions of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 65, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.037, "r_y0": 264.847, "r_x1": 150.415, "r_y1": 264.847, "r_x2": 150.415, "r_y2": 256.29499999999996, "r_x3": 70.037, "r_y3": 256.29499999999996, "coord_origin": "TOPLEFT"}, "text": "the bounding boxes.", "orig": "the bounding boxes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 0, "label": "text", "bbox": {"l": 50.112, "t": 279.472, "r": 286.365, "b": 395.621, "coord_origin": "TOPLEFT"}, "confidence": 0.9767085909843445, "cells": [{"index": 66, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 288.024, "r_x1": 286.365, "r_y1": 288.024, "r_x2": 286.365, "r_y2": 279.472, "r_x3": 62.067, "r_y3": 279.472, "coord_origin": "TOPLEFT"}, "text": "However, it is possible to mitigate those limitations by", "orig": "However, it is possible to mitigate those limitations by", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 67, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 299.979, "r_x1": 286.365, "r_y1": 299.979, "r_x2": 286.365, "r_y2": 291.427, "r_x3": 50.112, "r_y3": 291.427, "coord_origin": "TOPLEFT"}, "text": "combining the TableFormer predictions with the informa-", "orig": "combining the TableFormer predictions with the informa-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 68, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 311.934, "r_x1": 286.365, "r_y1": 311.934, "r_x2": 286.365, "r_y2": 303.382, "r_x3": 50.112, "r_y3": 303.382, "coord_origin": "TOPLEFT"}, "text": "tion already present inside a programmatic PDF document.", "orig": "tion already present inside a programmatic PDF document.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 69, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 323.889, "r_x1": 123.387, "r_y1": 323.889, "r_x2": 123.387, "r_y2": 315.337, "r_x3": 50.112, "r_y3": 315.337, "coord_origin": "TOPLEFT"}, "text": "More specifically,", "orig": "More specifically,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 70, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 128.348, "r_y0": 323.889, "r_x1": 286.365, "r_y1": 323.889, "r_x2": 286.365, "r_y2": 315.337, "r_x3": 128.348, "r_y3": 315.337, "coord_origin": "TOPLEFT"}, "text": "PDF documents can be seen as a se-", "orig": "PDF documents can be seen as a se-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 71, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 335.845, "r_x1": 286.365, "r_y1": 335.845, "r_x2": 286.365, "r_y2": 327.293, "r_x3": 50.112, "r_y3": 327.293, "coord_origin": "TOPLEFT"}, "text": "quence of PDF cells where each cell is described by its con-", "orig": "quence of PDF cells where each cell is described by its con-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 72, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 347.8, "r_x1": 286.365, "r_y1": 347.8, "r_x2": 286.365, "r_y2": 339.248, "r_x3": 50.112, "r_y3": 339.248, "coord_origin": "TOPLEFT"}, "text": "tent and bounding box. If we are able to associate the PDF", "orig": "tent and bounding box. If we are able to associate the PDF", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 73, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 359.755, "r_x1": 286.365, "r_y1": 359.755, "r_x2": 286.365, "r_y2": 351.203, "r_x3": 50.112, "r_y3": 351.203, "coord_origin": "TOPLEFT"}, "text": "cells with the predicted table cells, we can directly link the", "orig": "cells with the predicted table cells, we can directly link the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 74, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 371.71, "r_x1": 286.365, "r_y1": 371.71, "r_x2": 286.365, "r_y2": 363.158, "r_x3": 50.112, "r_y3": 363.158, "coord_origin": "TOPLEFT"}, "text": "PDF cell content to the table cell structure and use the PDF", "orig": "PDF cell content to the table cell structure and use the PDF", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 75, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 383.665, "r_x1": 286.365, "r_y1": 383.665, "r_x2": 286.365, "r_y2": 375.113, "r_x3": 50.112, "r_y3": 375.113, "coord_origin": "TOPLEFT"}, "text": "bounding boxes to correct misalignments in the predicted", "orig": "bounding boxes to correct misalignments in the predicted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 76, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 395.621, "r_x1": 154.56, "r_y1": 395.621, "r_x2": 154.56, "r_y2": 387.069, "r_x3": 50.112, "r_y3": 387.069, "coord_origin": "TOPLEFT"}, "text": "table cell bounding boxes.", "orig": "table cell bounding boxes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 11, "label": "text", "bbox": {"l": 50.112, "t": 399.338, "r": 286.365, "b": 419.846, "coord_origin": "TOPLEFT"}, "confidence": 0.934766411781311, "cells": [{"index": 77, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 407.89, "r_x1": 286.365, "r_y1": 407.89, "r_x2": 286.365, "r_y2": 399.338, "r_x3": 62.067, "r_y3": 399.338, "coord_origin": "TOPLEFT"}, "text": "Here is a step-by-step description of the prediction post-", "orig": "Here is a step-by-step description of the prediction post-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 78, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 419.846, "r_x1": 95.492, "r_y1": 419.846, "r_x2": 95.492, "r_y2": 411.294, "r_x3": 50.112, "r_y3": 411.294, "coord_origin": "TOPLEFT"}, "text": "processing:", "orig": "processing:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 20, "label": "list_item", "bbox": {"l": 50.112, "t": 423.564, "r": 286.365, "b": 456.026, "coord_origin": "TOPLEFT"}, "confidence": 0.8280702233314514, "cells": [{"index": 79, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 432.116, "r_x1": 286.365, "r_y1": 432.116, "r_x2": 286.365, "r_y2": 423.564, "r_x3": 62.067, "r_y3": 423.564, "coord_origin": "TOPLEFT"}, "text": "1. Get the minimal grid dimensions - number of rows and", "orig": "1. Get the minimal grid dimensions - number of rows and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 80, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 444.071, "r_x1": 218.779, "r_y1": 444.071, "r_x2": 218.779, "r_y2": 435.519, "r_x3": 50.112, "r_y3": 435.519, "coord_origin": "TOPLEFT"}, "text": "columns for the predicted table structure.", "orig": "columns for the predicted table structure.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 81, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 224.796, "r_y0": 444.071, "r_x1": 286.365, "r_y1": 444.071, "r_x2": 286.365, "r_y2": 435.519, "r_x3": 224.796, "r_y3": 435.519, "coord_origin": "TOPLEFT"}, "text": "This represents", "orig": "This represents", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 82, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 456.026, "r_x1": 274.51, "r_y1": 456.026, "r_x2": 274.51, "r_y2": 447.474, "r_x3": 50.112, "r_y3": 447.474, "coord_origin": "TOPLEFT"}, "text": "the most granular grid for the underlying table structure.", "orig": "the most granular grid for the underlying table structure.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 2, "label": "list_item", "bbox": {"l": 50.112, "t": 459.744, "r": 286.365, "b": 504.161, "coord_origin": "TOPLEFT"}, "confidence": 0.9646760821342468, "cells": [{"index": 83, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 468.296, "r_x1": 69.539, "r_y1": 468.296, "r_x2": 69.539, "r_y2": 459.744, "r_x3": 62.067, "r_y3": 459.744, "coord_origin": "TOPLEFT"}, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 84, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 77.429, "r_y0": 468.296, "r_x1": 286.365, "r_y1": 468.296, "r_x2": 286.365, "r_y2": 459.744, "r_x3": 77.429, "r_y3": 459.744, "coord_origin": "TOPLEFT"}, "text": "Generate pair-wise matches between the bounding", "orig": "Generate pair-wise matches between the bounding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 85, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 480.251, "r_x1": 286.365, "r_y1": 480.251, "r_x2": 286.365, "r_y2": 471.699, "r_x3": 50.112, "r_y3": 471.699, "coord_origin": "TOPLEFT"}, "text": "boxes of the PDF cells and the predicted cells. The Intersec-", "orig": "boxes of the PDF cells and the predicted cells. The Intersec-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 86, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 492.206, "r_x1": 286.365, "r_y1": 492.206, "r_x2": 286.365, "r_y2": 483.654, "r_x3": 50.112, "r_y3": 483.654, "coord_origin": "TOPLEFT"}, "text": "tion Over Union (IOU) metric is used to evaluate the quality", "orig": "tion Over Union (IOU) metric is used to evaluate the quality", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 87, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 504.161, "r_x1": 110.705, "r_y1": 504.161, "r_x2": 110.705, "r_y2": 495.609, "r_x3": 50.112, "r_y3": 495.609, "coord_origin": "TOPLEFT"}, "text": "of the matches.", "orig": "of the matches.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 10, "label": "list_item", "bbox": {"l": 50.112, "t": 507.879, "r": 286.365, "b": 528.387, "coord_origin": "TOPLEFT"}, "confidence": 0.9391399025917053, "cells": [{"index": 88, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 516.431, "r_x1": 69.539, "r_y1": 516.431, "r_x2": 69.539, "r_y2": 507.879, "r_x3": 62.067, "r_y3": 507.879, "coord_origin": "TOPLEFT"}, "text": "3.", "orig": "3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 89, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 75.248, "r_y0": 516.431, "r_x1": 286.365, "r_y1": 516.431, "r_x2": 286.365, "r_y2": 507.879, "r_x3": 75.248, "r_y3": 507.879, "coord_origin": "TOPLEFT"}, "text": "Use a carefully selected IOU threshold to designate", "orig": "Use a carefully selected IOU threshold to designate", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 90, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 528.387, "r_x1": 226.071, "r_y1": 528.387, "r_x2": 226.071, "r_y2": 519.835, "r_x3": 50.112, "r_y3": 519.835, "coord_origin": "TOPLEFT"}, "text": "the matches as 'good' ones and 'bad' ones.", "orig": "the matches as 'good' ones and 'bad' ones.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 8, "label": "list_item", "bbox": {"l": 50.112, "t": 532.104, "r": 286.365, "b": 564.567, "coord_origin": "TOPLEFT"}, "confidence": 0.9491708874702454, "cells": [{"index": 91, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 540.656, "r_x1": 76.453, "r_y1": 540.656, "r_x2": 76.453, "r_y2": 532.104, "r_x3": 62.067, "r_y3": 532.104, "coord_origin": "TOPLEFT"}, "text": "3.a.", "orig": "3.a.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 92, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 80.587, "r_y0": 540.656, "r_x1": 286.365, "r_y1": 540.656, "r_x2": 286.365, "r_y2": 532.104, "r_x3": 80.587, "r_y3": 532.104, "coord_origin": "TOPLEFT"}, "text": "If all IOU scores in a column are below the thresh-", "orig": "If all IOU scores in a column are below the thresh-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 93, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 552.612, "r_x1": 286.365, "r_y1": 552.612, "r_x2": 286.365, "r_y2": 544.06, "r_x3": 50.112, "r_y3": 544.06, "coord_origin": "TOPLEFT"}, "text": "old, discard all predictions (structure and bounding boxes)", "orig": "old, discard all predictions (structure and bounding boxes)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 94, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 564.567, "r_x1": 114.032, "r_y1": 564.567, "r_x2": 114.032, "r_y2": 556.015, "r_x3": 50.112, "r_y3": 556.015, "coord_origin": "TOPLEFT"}, "text": "for that column.", "orig": "for that column.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 5, "label": "list_item", "bbox": {"l": 50.112, "t": 568.285, "r": 286.365, "b": 600.7470000000001, "coord_origin": "TOPLEFT"}, "confidence": 0.9587163329124451, "cells": [{"index": 95, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 576.837, "r_x1": 69.539, "r_y1": 576.837, "r_x2": 69.539, "r_y2": 568.285, "r_x3": 62.067, "r_y3": 568.285, "coord_origin": "TOPLEFT"}, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 96, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 76.732, "r_y0": 576.837, "r_x1": 286.365, "r_y1": 576.837, "r_x2": 286.365, "r_y2": 568.285, "r_x3": 76.732, "r_y3": 568.285, "coord_origin": "TOPLEFT"}, "text": "Find the best-fitting content alignment for the pre-", "orig": "Find the best-fitting content alignment for the pre-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 97, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 588.792, "r_x1": 286.365, "r_y1": 588.792, "r_x2": 286.365, "r_y2": 580.24, "r_x3": 50.112, "r_y3": 580.24, "coord_origin": "TOPLEFT"}, "text": "dicted cells with good IOU per each column. The alignment", "orig": "dicted cells with good IOU per each column. The alignment", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 98, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 600.7470000000001, "r_x1": 278.704, "r_y1": 600.7470000000001, "r_x2": 278.704, "r_y2": 592.1949999999999, "r_x3": 50.112, "r_y3": 592.1949999999999, "coord_origin": "TOPLEFT"}, "text": "of the column can be identified by the following formula:", "orig": "of the column can be identified by the following formula:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 12, "label": "formula", "bbox": {"l": 110.705, "t": 624.104, "r": 286.362, "b": 654.998, "coord_origin": "TOPLEFT"}, "confidence": 0.9298412799835205, "cells": [{"index": 99, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 112.028, "r_y0": 632.81, "r_x1": 157.952, "r_y1": 632.81, "r_x2": 157.952, "r_y2": 624.104, "r_x3": 112.028, "r_y3": 624.104, "coord_origin": "TOPLEFT"}, "text": "alignment", "orig": "alignment", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 100, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.715, "r_y0": 632.81, "r_x1": 203.496, "r_y1": 632.81, "r_x2": 203.496, "r_y2": 624.104, "r_x3": 160.715, "r_y3": 624.104, "coord_origin": "TOPLEFT"}, "text": "= arg min", "orig": "= arg min", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 101, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 185.585, "r_y0": 640.154, "r_x1": 189.145, "r_y1": 640.154, "r_x2": 189.145, "r_y2": 634.06, "r_x3": 185.585, "r_y3": 634.06, "coord_origin": "TOPLEFT"}, "text": "c", "orig": "c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 102, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 203.499, "r_y0": 632.668, "r_x1": 208.48, "r_y1": 632.668, "r_x2": 208.48, "r_y2": 624.104, "r_x3": 203.499, "r_y3": 624.104, "coord_origin": "TOPLEFT"}, "text": "{", "orig": "{", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 103, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 208.481, "r_y0": 632.81, "r_x1": 216.729, "r_y1": 632.81, "r_x2": 216.729, "r_y2": 624.104, "r_x3": 208.481, "r_y3": 624.104, "coord_origin": "TOPLEFT"}, "text": "D", "orig": "D", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 104, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 216.729, "r_y0": 633.734, "r_x1": 220.289, "r_y1": 633.734, "r_x2": 220.289, "r_y2": 627.64, "r_x3": 216.729, "r_y3": 627.64, "coord_origin": "TOPLEFT"}, "text": "c", "orig": "c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 105, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 220.787, "r_y0": 632.668, "r_x1": 225.768, "r_y1": 632.668, "r_x2": 225.768, "r_y2": 624.104, "r_x3": 220.787, "r_y3": 624.104, "coord_origin": "TOPLEFT"}, "text": "}", "orig": "}", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 106, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 110.705, "r_y0": 654.075, "r_x1": 118.953, "r_y1": 654.075, "r_x2": 118.953, "r_y2": 645.369, "r_x3": 110.705, "r_y3": 645.369, "coord_origin": "TOPLEFT"}, "text": "D", "orig": "D", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 107, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 118.953, "r_y0": 654.998, "r_x1": 122.513, "r_y1": 654.998, "r_x2": 122.513, "r_y2": 648.904, "r_x3": 118.953, "r_y3": 648.904, "coord_origin": "TOPLEFT"}, "text": "c", "orig": "c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 108, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 125.779, "r_y0": 654.075, "r_x1": 133.528, "r_y1": 654.075, "r_x2": 133.528, "r_y2": 645.369, "r_x3": 125.779, "r_y3": 645.369, "coord_origin": "TOPLEFT"}, "text": "=", "orig": "=", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 109, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 136.295, "r_y0": 654.075, "r_x1": 166.678, "r_y1": 654.075, "r_x2": 166.678, "r_y2": 645.369, "r_x3": 136.295, "r_y3": 645.369, "coord_origin": "TOPLEFT"}, "text": "max x", "orig": "max x", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 110, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 156.003, "r_y0": 653.933, "r_x1": 160.984, "r_y1": 653.933, "r_x2": 160.984, "r_y2": 645.369, "r_x3": 156.003, "r_y3": 645.369, "coord_origin": "TOPLEFT"}, "text": "{", "orig": "{", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 111, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 166.678, "r_y0": 654.998, "r_x1": 170.238, "r_y1": 654.998, "r_x2": 170.238, "r_y2": 648.904, "r_x3": 166.678, "r_y3": 648.904, "coord_origin": "TOPLEFT"}, "text": "c", "orig": "c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 112, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 170.736, "r_y0": 653.933, "r_x1": 185.678, "r_y1": 653.933, "r_x2": 185.678, "r_y2": 645.369, "r_x3": 170.736, "r_y3": 645.369, "coord_origin": "TOPLEFT"}, "text": "} -", "orig": "} -", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 113, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 187.894, "r_y0": 654.075, "r_x1": 216.729, "r_y1": 654.075, "r_x2": 216.729, "r_y2": 645.369, "r_x3": 187.894, "r_y3": 645.369, "coord_origin": "TOPLEFT"}, "text": "min x", "orig": "min x", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 114, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 206.054, "r_y0": 653.933, "r_x1": 211.035, "r_y1": 653.933, "r_x2": 211.035, "r_y2": 645.369, "r_x3": 206.054, "r_y3": 645.369, "coord_origin": "TOPLEFT"}, "text": "{", "orig": "{", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 115, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 216.729, "r_y0": 654.998, "r_x1": 220.289, "r_y1": 654.998, "r_x2": 220.289, "r_y2": 648.904, "r_x3": 216.729, "r_y3": 648.904, "coord_origin": "TOPLEFT"}, "text": "c", "orig": "c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 116, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 220.787, "r_y0": 653.933, "r_x1": 225.768, "r_y1": 653.933, "r_x2": 225.768, "r_y2": 645.369, "r_x3": 220.787, "r_y3": 645.369, "coord_origin": "TOPLEFT"}, "text": "}", "orig": "}", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 117, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 274.746, "r_y0": 643.706, "r_x1": 286.362, "r_y1": 643.706, "r_x2": 286.362, "r_y2": 635.154, "r_x3": 274.746, "r_y3": 635.154, "coord_origin": "TOPLEFT"}, "text": "(4)", "orig": "(4)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 7, "label": "text", "bbox": {"l": 50.112, "t": 668.016, "r": 286.362, "b": 688.841, "coord_origin": "TOPLEFT"}, "confidence": 0.9545555114746094, "cells": [{"index": 118, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 676.886, "r_x1": 74.451, "r_y1": 676.886, "r_x2": 74.451, "r_y2": 668.3340000000001, "r_x3": 50.112, "r_y3": 668.3340000000001, "coord_origin": "TOPLEFT"}, "text": "where", "orig": "where", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 119, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 78.336, "r_y0": 676.722, "r_x1": 82.648, "r_y1": 676.722, "r_x2": 82.648, "r_y2": 668.016, "r_x3": 78.336, "r_y3": 668.016, "coord_origin": "TOPLEFT"}, "text": "c", "orig": "c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 120, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 86.533, "r_y0": 676.886, "r_x1": 93.178, "r_y1": 676.886, "r_x2": 93.178, "r_y2": 668.3340000000001, "r_x3": 86.533, "r_y3": 668.3340000000001, "coord_origin": "TOPLEFT"}, "text": "is", "orig": "is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 121, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 97.063, "r_y0": 676.886, "r_x1": 123.634, "r_y1": 676.886, "r_x2": 123.634, "r_y2": 668.3340000000001, "r_x3": 97.063, "r_y3": 668.3340000000001, "coord_origin": "TOPLEFT"}, "text": "one of", "orig": "one of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 122, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 127.519, "r_y0": 676.58, "r_x1": 132.5, "r_y1": 676.58, "r_x2": 132.5, "r_y2": 668.016, "r_x3": 127.519, "r_y3": 668.016, "coord_origin": "TOPLEFT"}, "text": "{", "orig": "{", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 123, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 132.501, "r_y0": 676.886, "r_x1": 148.272, "r_y1": 676.886, "r_x2": 148.272, "r_y2": 668.3340000000001, "r_x3": 132.501, "r_y3": 668.3340000000001, "coord_origin": "TOPLEFT"}, "text": "left,", "orig": "left,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 124, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 152.506, "r_y0": 676.886, "r_x1": 187.644, "r_y1": 676.886, "r_x2": 187.644, "r_y2": 668.3340000000001, "r_x3": 152.506, "r_y3": 668.3340000000001, "coord_origin": "TOPLEFT"}, "text": "centroid,", "orig": "centroid,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 125, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 191.878, "r_y0": 676.886, "r_x1": 210.697, "r_y1": 676.886, "r_x2": 210.697, "r_y2": 668.3340000000001, "r_x3": 191.878, "r_y3": 668.3340000000001, "coord_origin": "TOPLEFT"}, "text": "right", "orig": "right", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 126, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 210.697, "r_y0": 676.58, "r_x1": 215.678, "r_y1": 676.58, "r_x2": 215.678, "r_y2": 668.016, "r_x3": 210.697, "r_y3": 668.016, "coord_origin": "TOPLEFT"}, "text": "}", "orig": "}", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 127, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 219.563, "r_y0": 676.886, "r_x1": 233.949, "r_y1": 676.886, "r_x2": 233.949, "r_y2": 668.3340000000001, "r_x3": 219.563, "r_y3": 668.3340000000001, "coord_origin": "TOPLEFT"}, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 128, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 237.835, "r_y0": 676.722, "r_x1": 243.529, "r_y1": 676.722, "r_x2": 243.529, "r_y2": 668.016, "r_x3": 237.835, "r_y3": 668.016, "coord_origin": "TOPLEFT"}, "text": "x", "orig": "x", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 129, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 243.529, "r_y0": 677.645, "r_x1": 247.089, "r_y1": 677.645, "r_x2": 247.089, "r_y2": 671.551, "r_x3": 243.529, "r_y3": 671.551, "coord_origin": "TOPLEFT"}, "text": "c", "orig": "c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 130, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 251.473, "r_y0": 676.886, "r_x1": 258.118, "r_y1": 676.886, "r_x2": 258.118, "r_y2": 668.3340000000001, "r_x3": 251.473, "r_y3": 668.3340000000001, "coord_origin": "TOPLEFT"}, "text": "is", "orig": "is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 131, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 262.003, "r_y0": 676.886, "r_x1": 286.362, "r_y1": 676.886, "r_x2": 286.362, "r_y2": 668.3340000000001, "r_x3": 262.003, "r_y3": 668.3340000000001, "coord_origin": "TOPLEFT"}, "text": "the x-", "orig": "the x-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 132, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 688.841, "r_x1": 205.887, "r_y1": 688.841, "r_x2": 205.887, "r_y2": 680.289, "r_x3": 50.112, "r_y3": 680.289, "coord_origin": "TOPLEFT"}, "text": "coordinate for the corresponding point.", "orig": "coordinate for the corresponding point.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 13, "label": "list_item", "bbox": {"l": 50.112, "t": 692.559, "r": 286.365, "b": 713.066, "coord_origin": "TOPLEFT"}, "confidence": 0.9260510206222534, "cells": [{"index": 133, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 701.111, "r_x1": 69.539, "r_y1": 701.111, "r_x2": 69.539, "r_y2": 692.559, "r_x3": 62.067, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "5.", "orig": "5.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 134, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 76.274, "r_y0": 701.111, "r_x1": 286.365, "r_y1": 701.111, "r_x2": 286.365, "r_y2": 692.559, "r_x3": 76.274, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "Use the alignment computed in step 4, to compute", "orig": "Use the alignment computed in step 4, to compute", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 135, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 713.066, "r_x1": 94.605, "r_y1": 713.066, "r_x2": 94.605, "r_y2": 704.514, "r_x3": 50.112, "r_y3": 704.514, "coord_origin": "TOPLEFT"}, "text": "the median", "orig": "the median", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 136, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 97.599, "r_y0": 712.902, "r_x1": 103.293, "r_y1": 712.902, "r_x2": 103.293, "r_y2": 704.196, "r_x3": 97.599, "r_y3": 704.196, "coord_origin": "TOPLEFT"}, "text": "x", "orig": "x", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 137, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 103.292, "r_y0": 713.066, "r_x1": 286.365, "r_y1": 713.066, "r_x2": 286.365, "r_y2": 704.514, "r_x3": 103.292, "r_y3": 704.514, "coord_origin": "TOPLEFT"}, "text": "-coordinate for all table columns and the me-", "orig": "-coordinate for all table columns and the me-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 16, "label": "text", "bbox": {"l": 308.862, "t": 211.20000000000005, "r": 545.115, "b": 255.61800000000005, "coord_origin": "TOPLEFT"}, "confidence": 0.8942298889160156, "cells": [{"index": 138, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 219.75199999999995, "r_x1": 435.915, "r_y1": 219.75199999999995, "r_x2": 435.915, "r_y2": 211.20000000000005, "r_x3": 308.862, "r_y3": 211.20000000000005, "coord_origin": "TOPLEFT"}, "text": "dian cell size for all table cells.", "orig": "dian cell size for all table cells.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 139, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 440.697, "r_y0": 219.75199999999995, "r_x1": 545.115, "r_y1": 219.75199999999995, "r_x2": 545.115, "r_y2": 211.20000000000005, "r_x3": 440.697, "r_y3": 211.20000000000005, "coord_origin": "TOPLEFT"}, "text": "The usage of median dur-", "orig": "The usage of median dur-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 140, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 231.70799999999997, "r_x1": 545.115, "r_y1": 231.70799999999997, "r_x2": 545.115, "r_y2": 223.15599999999995, "r_x3": 308.862, "r_y3": 223.15599999999995, "coord_origin": "TOPLEFT"}, "text": "ing the computations, helps to eliminate outliers caused by", "orig": "ing the computations, helps to eliminate outliers caused by", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 141, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 243.663, "r_x1": 545.115, "r_y1": 243.663, "r_x2": 545.115, "r_y2": 235.111, "r_x3": 308.862, "r_y3": 235.111, "coord_origin": "TOPLEFT"}, "text": "occasional column spans which are usually wider than the", "orig": "occasional column spans which are usually wider than the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 142, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 255.61800000000005, "r_x1": 339.577, "r_y1": 255.61800000000005, "r_x2": 339.577, "r_y2": 247.06600000000003, "r_x3": 308.862, "r_y3": 247.06600000000003, "coord_origin": "TOPLEFT"}, "text": "normal.", "orig": "normal.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 9, "label": "list_item", "bbox": {"l": 308.862, "t": 259.371, "r": 545.115, "b": 279.87800000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.9423392415046692, "cells": [{"index": 143, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 267.923, "r_x1": 328.289, "r_y1": 267.923, "r_x2": 328.289, "r_y2": 259.371, "r_x3": 320.817, "r_y3": 259.371, "coord_origin": "TOPLEFT"}, "text": "6.", "orig": "6.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 144, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 334.884, "r_y0": 267.923, "r_x1": 545.115, "r_y1": 267.923, "r_x2": 545.115, "r_y2": 259.371, "r_x3": 334.884, "r_y3": 259.371, "coord_origin": "TOPLEFT"}, "text": "Snap all cells with bad IOU to their corresponding", "orig": "Snap all cells with bad IOU to their corresponding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 145, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 279.87800000000004, "r_x1": 338.192, "r_y1": 279.87800000000004, "r_x2": 338.192, "r_y2": 271.326, "r_x3": 308.862, "r_y3": 271.326, "coord_origin": "TOPLEFT"}, "text": "median", "orig": "median", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 146, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 340.682, "r_y0": 279.71400000000006, "r_x1": 346.376, "r_y1": 279.71400000000006, "r_x2": 346.376, "r_y2": 271.00800000000004, "r_x3": 340.682, "r_y3": 271.00800000000004, "coord_origin": "TOPLEFT"}, "text": "x", "orig": "x", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 147, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 346.376, "r_y0": 279.87800000000004, "r_x1": 453.723, "r_y1": 279.87800000000004, "r_x2": 453.723, "r_y2": 271.326, "r_x3": 346.376, "r_y3": 271.326, "coord_origin": "TOPLEFT"}, "text": "-coordinates and cell sizes.", "orig": "-coordinates and cell sizes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 6, "label": "list_item", "bbox": {"l": 308.862, "t": 283.632, "r": 545.115, "b": 387.825, "coord_origin": "TOPLEFT"}, "confidence": 0.9562004804611206, "cells": [{"index": 148, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 292.184, "r_x1": 328.289, "r_y1": 292.184, "r_x2": 328.289, "r_y2": 283.632, "r_x3": 320.817, "r_y3": 283.632, "coord_origin": "TOPLEFT"}, "text": "7.", "orig": "7.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 149, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 332.144, "r_y0": 292.184, "r_x1": 545.115, "r_y1": 292.184, "r_x2": 545.115, "r_y2": 283.632, "r_x3": 332.144, "r_y3": 283.632, "coord_origin": "TOPLEFT"}, "text": "Generate a new set of pair-wise matches between the", "orig": "Generate a new set of pair-wise matches between the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 150, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 304.139, "r_x1": 476.562, "r_y1": 304.139, "r_x2": 476.562, "r_y2": 295.587, "r_x3": 308.862, "r_y3": 295.587, "coord_origin": "TOPLEFT"}, "text": "corrected bounding boxes and PDF cells.", "orig": "corrected bounding boxes and PDF cells.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 151, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 482.082, "r_y0": 304.139, "r_x1": 545.115, "r_y1": 304.139, "r_x2": 545.115, "r_y2": 295.587, "r_x3": 482.082, "r_y3": 295.587, "coord_origin": "TOPLEFT"}, "text": "This time use a", "orig": "This time use a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 152, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 316.094, "r_x1": 545.115, "r_y1": 316.094, "r_x2": 545.115, "r_y2": 307.542, "r_x3": 308.862, "r_y3": 307.542, "coord_origin": "TOPLEFT"}, "text": "modified version of the IOU metric, where the area of the", "orig": "modified version of the IOU metric, where the area of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 153, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 328.049, "r_x1": 545.115, "r_y1": 328.049, "r_x2": 545.115, "r_y2": 319.497, "r_x3": 308.862, "r_y3": 319.497, "coord_origin": "TOPLEFT"}, "text": "intersection between the predicted and PDF cells is divided", "orig": "intersection between the predicted and PDF cells is divided", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 154, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 340.005, "r_x1": 397.19, "r_y1": 340.005, "r_x2": 397.19, "r_y2": 331.453, "r_x3": 308.862, "r_y3": 331.453, "coord_origin": "TOPLEFT"}, "text": "by the PDF cell area.", "orig": "by the PDF cell area.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 155, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 403.656, "r_y0": 340.005, "r_x1": 545.115, "r_y1": 340.005, "r_x2": 545.115, "r_y2": 331.453, "r_x3": 403.656, "r_y3": 331.453, "coord_origin": "TOPLEFT"}, "text": "In case there are multiple matches", "orig": "In case there are multiple matches", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 156, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 351.96, "r_x1": 545.115, "r_y1": 351.96, "r_x2": 545.115, "r_y2": 343.408, "r_x3": 308.862, "r_y3": 343.408, "coord_origin": "TOPLEFT"}, "text": "for the same PDF cell, the prediction with the higher score", "orig": "for the same PDF cell, the prediction with the higher score", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 157, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 363.915, "r_x1": 357.26, "r_y1": 363.915, "r_x2": 357.26, "r_y2": 355.363, "r_x3": 308.862, "r_y3": 355.363, "coord_origin": "TOPLEFT"}, "text": "is preferred.", "orig": "is preferred.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 158, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 361.176, "r_y0": 363.915, "r_x1": 545.115, "r_y1": 363.915, "r_x2": 545.115, "r_y2": 355.363, "r_x3": 361.176, "r_y3": 355.363, "coord_origin": "TOPLEFT"}, "text": "This covers the cases where the PDF cells are", "orig": "This covers the cases where the PDF cells are", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 159, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 375.87, "r_x1": 545.115, "r_y1": 375.87, "r_x2": 545.115, "r_y2": 367.318, "r_x3": 308.862, "r_y3": 367.318, "coord_origin": "TOPLEFT"}, "text": "smaller than the area of predicted or corrected prediction", "orig": "smaller than the area of predicted or corrected prediction", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 160, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 387.825, "r_x1": 329.614, "r_y1": 387.825, "r_x2": 329.614, "r_y2": 379.273, "r_x3": 308.862, "r_y3": 379.273, "coord_origin": "TOPLEFT"}, "text": "cells.", "orig": "cells.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 17, "label": "list_item", "bbox": {"l": 308.862, "t": 391.579, "r": 545.115, "b": 459.906, "coord_origin": "TOPLEFT"}, "confidence": 0.8719939589500427, "cells": [{"index": 161, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 400.131, "r_x1": 328.289, "r_y1": 400.131, "r_x2": 328.289, "r_y2": 391.579, "r_x3": 320.817, "r_y3": 391.579, "coord_origin": "TOPLEFT"}, "text": "8.", "orig": "8.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 162, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 333.569, "r_y0": 400.131, "r_x1": 545.115, "r_y1": 400.131, "r_x2": 545.115, "r_y2": 391.579, "r_x3": 333.569, "r_y3": 391.579, "coord_origin": "TOPLEFT"}, "text": "In some rare occasions, we have noticed that Table-", "orig": "In some rare occasions, we have noticed that Table-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 163, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 412.086, "r_x1": 545.115, "r_y1": 412.086, "r_x2": 545.115, "r_y2": 403.534, "r_x3": 308.862, "r_y3": 403.534, "coord_origin": "TOPLEFT"}, "text": "Former can confuse a single column as two. When the post-", "orig": "Former can confuse a single column as two. When the post-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 164, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 424.041, "r_x1": 545.115, "r_y1": 424.041, "r_x2": 545.115, "r_y2": 415.489, "r_x3": 308.862, "r_y3": 415.489, "coord_origin": "TOPLEFT"}, "text": "processing steps are applied, this results with two predicted", "orig": "processing steps are applied, this results with two predicted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 165, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 435.996, "r_x1": 488.109, "r_y1": 435.996, "r_x2": 488.109, "r_y2": 427.444, "r_x3": 308.862, "r_y3": 427.444, "coord_origin": "TOPLEFT"}, "text": "columns pointing to the same PDF column.", "orig": "columns pointing to the same PDF column.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 166, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 494.336, "r_y0": 435.996, "r_x1": 545.115, "r_y1": 435.996, "r_x2": 545.115, "r_y2": 427.444, "r_x3": 494.336, "r_y3": 427.444, "coord_origin": "TOPLEFT"}, "text": "In such case", "orig": "In such case", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 167, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 447.951, "r_x1": 545.115, "r_y1": 447.951, "r_x2": 545.115, "r_y2": 439.399, "r_x3": 308.862, "r_y3": 439.399, "coord_origin": "TOPLEFT"}, "text": "we must de-duplicate the columns according to highest to-", "orig": "we must de-duplicate the columns according to highest to-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 168, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 459.906, "r_x1": 426.182, "r_y1": 459.906, "r_x2": 426.182, "r_y2": 451.354, "r_x3": 308.862, "r_y3": 451.354, "coord_origin": "TOPLEFT"}, "text": "tal column intersection score.", "orig": "tal column intersection score.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 15, "label": "list_item", "bbox": {"l": 308.862, "t": 463.66, "r": 545.115, "b": 567.8530000000001, "coord_origin": "TOPLEFT"}, "confidence": 0.9126082062721252, "cells": [{"index": 169, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 472.212, "r_x1": 328.289, "r_y1": 472.212, "r_x2": 328.289, "r_y2": 463.66, "r_x3": 320.817, "r_y3": 463.66, "coord_origin": "TOPLEFT"}, "text": "9.", "orig": "9.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 170, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 333.629, "r_y0": 472.212, "r_x1": 478.505, "r_y1": 472.212, "r_x2": 478.505, "r_y2": 463.66, "r_x3": 333.629, "r_y3": 463.66, "coord_origin": "TOPLEFT"}, "text": "Pick up the remaining orphan cells.", "orig": "Pick up the remaining orphan cells.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 171, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 483.855, "r_y0": 472.212, "r_x1": 545.115, "r_y1": 472.212, "r_x2": 545.115, "r_y2": 463.66, "r_x3": 483.855, "r_y3": 463.66, "coord_origin": "TOPLEFT"}, "text": "There could be", "orig": "There could be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 172, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 484.167, "r_x1": 545.115, "r_y1": 484.167, "r_x2": 545.115, "r_y2": 475.615, "r_x3": 308.862, "r_y3": 475.615, "coord_origin": "TOPLEFT"}, "text": "cases, when after applying all the previous post-processing", "orig": "cases, when after applying all the previous post-processing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 173, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 496.122, "r_x1": 545.115, "r_y1": 496.122, "r_x2": 545.115, "r_y2": 487.57, "r_x3": 308.862, "r_y3": 487.57, "coord_origin": "TOPLEFT"}, "text": "steps, some PDF cells could still remain without any match", "orig": "steps, some PDF cells could still remain without any match", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 174, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 508.077, "r_x1": 381.898, "r_y1": 508.077, "r_x2": 381.898, "r_y2": 499.525, "r_x3": 308.862, "r_y3": 499.525, "coord_origin": "TOPLEFT"}, "text": "to predicted cells.", "orig": "to predicted cells.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 175, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 388.702, "r_y0": 508.077, "r_x1": 545.115, "r_y1": 508.077, "r_x2": 545.115, "r_y2": 499.525, "r_x3": 388.702, "r_y3": 499.525, "coord_origin": "TOPLEFT"}, "text": "However, it is still possible to deduce", "orig": "However, it is still possible to deduce", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 176, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 520.033, "r_x1": 545.115, "r_y1": 520.033, "r_x2": 545.115, "r_y2": 511.481, "r_x3": 308.862, "r_y3": 511.481, "coord_origin": "TOPLEFT"}, "text": "the correct matching for an orphan PDF cell by mapping its", "orig": "the correct matching for an orphan PDF cell by mapping its", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 177, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 531.988, "r_x1": 483.576, "r_y1": 531.988, "r_x2": 483.576, "r_y2": 523.4359999999999, "r_x3": 308.862, "r_y3": 523.4359999999999, "coord_origin": "TOPLEFT"}, "text": "bounding box on the geometry of the grid.", "orig": "bounding box on the geometry of the grid.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 178, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 489.195, "r_y0": 531.988, "r_x1": 545.115, "r_y1": 531.988, "r_x2": 545.115, "r_y2": 523.4359999999999, "r_x3": 489.195, "r_y3": 523.4359999999999, "coord_origin": "TOPLEFT"}, "text": "This mapping", "orig": "This mapping", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 179, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 543.943, "r_x1": 545.115, "r_y1": 543.943, "r_x2": 545.115, "r_y2": 535.3910000000001, "r_x3": 308.862, "r_y3": 535.3910000000001, "coord_origin": "TOPLEFT"}, "text": "decides if the content of the orphan cell will be appended to", "orig": "decides if the content of the orphan cell will be appended to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 180, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 555.898, "r_x1": 545.115, "r_y1": 555.898, "r_x2": 545.115, "r_y2": 547.346, "r_x3": 308.862, "r_y3": 547.346, "coord_origin": "TOPLEFT"}, "text": "an already matched table cell, or a new table cell should be", "orig": "an already matched table cell, or a new table cell should be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 181, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 567.8530000000001, "r_x1": 442.221, "r_y1": 567.8530000000001, "r_x2": 442.221, "r_y2": 559.3009999999999, "r_x3": 308.862, "r_y3": 559.3009999999999, "coord_origin": "TOPLEFT"}, "text": "created to match with the orphan.", "orig": "created to match with the orphan.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 19, "label": "text", "bbox": {"l": 308.862, "t": 571.607, "r": 545.117, "b": 604.069, "coord_origin": "TOPLEFT"}, "confidence": 0.8459473848342896, "cells": [{"index": 182, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 580.159, "r_x1": 332.712, "r_y1": 580.159, "r_x2": 332.712, "r_y2": 571.607, "r_x3": 320.817, "r_y3": 571.607, "coord_origin": "TOPLEFT"}, "text": "9a.", "orig": "9a.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 183, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 337.943, "r_y0": 580.159, "r_x1": 545.115, "r_y1": 580.159, "r_x2": 545.115, "r_y2": 571.607, "r_x3": 337.943, "r_y3": 571.607, "coord_origin": "TOPLEFT"}, "text": "Compute the top and bottom boundary of the hori-", "orig": "Compute the top and bottom boundary of the hori-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 184, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 592.114, "r_x1": 471.641, "r_y1": 592.114, "r_x2": 471.641, "r_y2": 583.562, "r_x3": 308.862, "r_y3": 583.562, "coord_origin": "TOPLEFT"}, "text": "zontal band for each grid row (min/max", "orig": "zontal band for each grid row (min/max", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 185, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 474.834, "r_y0": 591.95, "r_x1": 479.719, "r_y1": 591.95, "r_x2": 479.719, "r_y2": 583.244, "r_x3": 474.834, "r_y3": 583.244, "coord_origin": "TOPLEFT"}, "text": "y", "orig": "y", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 186, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 483.269, "r_y0": 592.114, "r_x1": 545.117, "r_y1": 592.114, "r_x2": 545.117, "r_y2": 583.562, "r_x3": 483.269, "r_y3": 583.562, "coord_origin": "TOPLEFT"}, "text": "coordinates per", "orig": "coordinates per", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 187, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 604.069, "r_x1": 329.913, "r_y1": 604.069, "r_x2": 329.913, "r_y2": 595.517, "r_x3": 308.862, "r_y3": 595.517, "coord_origin": "TOPLEFT"}, "text": "row).", "orig": "row).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 21, "label": "list_item", "bbox": {"l": 308.862, "t": 607.822, "r": 545.115, "b": 628.33, "coord_origin": "TOPLEFT"}, "confidence": 0.7716891169548035, "cells": [{"index": 188, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 616.374, "r_x1": 332.872, "r_y1": 616.374, "r_x2": 332.872, "r_y2": 607.822, "r_x3": 320.817, "r_y3": 607.822, "coord_origin": "TOPLEFT"}, "text": "9b.", "orig": "9b.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 189, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 339.925, "r_y0": 616.374, "r_x1": 374.226, "r_y1": 616.374, "r_x2": 374.226, "r_y2": 607.822, "r_x3": 339.925, "r_y3": 607.822, "coord_origin": "TOPLEFT"}, "text": "Intersect", "orig": "Intersect", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 190, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 378.042, "r_y0": 616.374, "r_x1": 545.115, "r_y1": 616.374, "r_x2": 545.115, "r_y2": 607.822, "r_x3": 378.042, "r_y3": 607.822, "coord_origin": "TOPLEFT"}, "text": "the orphan's bounding box with the row", "orig": "the orphan's bounding box with the row", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 191, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 628.33, "r_x1": 495.292, "r_y1": 628.33, "r_x2": 495.292, "r_y2": 619.778, "r_x3": 308.862, "r_y3": 619.778, "coord_origin": "TOPLEFT"}, "text": "bands, and map the cell to the closest grid row.", "orig": "bands, and map the cell to the closest grid row.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 18, "label": "list_item", "bbox": {"l": 308.862, "t": 632.083, "r": 545.115, "b": 664.545, "coord_origin": "TOPLEFT"}, "confidence": 0.8584907054901123, "cells": [{"index": 192, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 640.635, "r_x1": 332.712, "r_y1": 640.635, "r_x2": 332.712, "r_y2": 632.083, "r_x3": 320.817, "r_y3": 632.083, "coord_origin": "TOPLEFT"}, "text": "9c.", "orig": "9c.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 193, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 337.534, "r_y0": 640.635, "r_x1": 545.115, "r_y1": 640.635, "r_x2": 545.115, "r_y2": 632.083, "r_x3": 337.534, "r_y3": 632.083, "coord_origin": "TOPLEFT"}, "text": "Compute the left and right boundary of the vertical", "orig": "Compute the left and right boundary of the vertical", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 194, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 652.59, "r_x1": 455.282, "r_y1": 652.59, "r_x2": 455.282, "r_y2": 644.038, "r_x3": 308.862, "r_y3": 644.038, "coord_origin": "TOPLEFT"}, "text": "band for each grid column (min/max", "orig": "band for each grid column (min/max", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 195, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 457.777, "r_y0": 652.4259999999999, "r_x1": 463.471, "r_y1": 652.4259999999999, "r_x2": 463.471, "r_y2": 643.72, "r_x3": 457.777, "r_y3": 643.72, "coord_origin": "TOPLEFT"}, "text": "x", "orig": "x", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 196, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 465.971, "r_y0": 652.59, "r_x1": 545.114, "r_y1": 652.59, "r_x2": 545.114, "r_y2": 644.038, "r_x3": 465.971, "r_y3": 644.038, "coord_origin": "TOPLEFT"}, "text": "coordinates per col-", "orig": "coordinates per col-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 197, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 664.545, "r_x1": 332.384, "r_y1": 664.545, "r_x2": 332.384, "r_y2": 655.9929999999999, "r_x3": 308.862, "r_y3": 655.9929999999999, "coord_origin": "TOPLEFT"}, "text": "umn).", "orig": "umn).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 22, "label": "list_item", "bbox": {"l": 308.862, "t": 668.299, "r": 545.115, "b": 688.806, "coord_origin": "TOPLEFT"}, "confidence": 0.7590745091438293, "cells": [{"index": 198, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 676.851, "r_x1": 545.115, "r_y1": 676.851, "r_x2": 545.115, "r_y2": 668.299, "r_x3": 320.817, "r_y3": 668.299, "coord_origin": "TOPLEFT"}, "text": "9d. Intersect the orphan's bounding box with the column", "orig": "9d. Intersect the orphan's bounding box with the column", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 199, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 688.806, "r_x1": 510.585, "r_y1": 688.806, "r_x2": 510.585, "r_y2": 680.254, "r_x3": 308.862, "r_y3": 680.254, "coord_origin": "TOPLEFT"}, "text": "bands, and map the cell to the closest grid column.", "orig": "bands, and map the cell to the closest grid column.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 25, "label": "list_item", "bbox": {"l": 308.862, "t": 692.559, "r": 545.115, "b": 713.066, "coord_origin": "TOPLEFT"}, "confidence": 0.6971189975738525, "cells": [{"index": 200, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 701.111, "r_x1": 545.115, "r_y1": 701.111, "r_x2": 545.115, "r_y2": 692.559, "r_x3": 320.817, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "9e. If the table cell under the identified row and column", "orig": "9e. If the table cell under the identified row and column", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 201, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 713.066, "r_x1": 545.115, "r_y1": 713.066, "r_x2": 545.115, "r_y2": 704.514, "r_x3": 308.862, "r_y3": 704.514, "coord_origin": "TOPLEFT"}, "text": "is not empty, extend its content with the content of the or-", "orig": "is not empty, extend its content with the content of the or-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 14, "label": "page_footer", "bbox": {"l": 292.631, "t": 734.402, "r": 302.594, "b": 742.954, "coord_origin": "TOPLEFT"}, "confidence": 0.9126598238945007, "cells": [{"index": 202, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 292.631, "r_y0": 742.954, "r_x1": 302.594, "r_y1": 742.954, "r_x2": 302.594, "r_y2": 734.402, "r_x3": 292.631, "r_y3": 734.402, "coord_origin": "TOPLEFT"}, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}]}, "tablestructure": {"table_map": {}}, "figures_classification": null, "equations_prediction": null, "vlm_response": null}, "assembled": {"elements": [{"label": "picture", "id": 30, "page_no": 11, "cluster": {"id": 30, "label": "picture", "bbox": {"l": 53.54227066040039, "t": 74.74854278564453, "r": 544.938232421875, "b": 147.59091186523438, "coord_origin": "TOPLEFT"}, "confidence": 0.6033818125724792, "cells": [{"index": 0, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 119.391, "r_y0": 83.19600000000003, "r_x1": 151.946, "r_y1": 83.19600000000003, "r_x2": 151.946, "r_y2": 77.543, "r_x3": 119.391, "r_y3": 77.543, "coord_origin": "TOPLEFT"}, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 53.346, "r_y0": 81.077, "r_x1": 59.327, "r_y1": 81.077, "r_x2": 59.327, "r_y2": 75.42399999999998, "r_x3": 53.346, "r_y3": 75.42399999999998, "coord_origin": "TOPLEFT"}, "text": "b.", "orig": "b.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 289.579, "r_y0": 83.34400000000005, "r_x1": 319.827, "r_y1": 83.34400000000005, "r_x2": 319.827, "r_y2": 77.69100000000003, "r_x3": 289.579, "r_y3": 77.69100000000003, "coord_origin": "TOPLEFT"}, "text": "FinTabNet", "orig": "FinTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 448.373, "r_y0": 83.13999999999999, "r_x1": 481.759, "r_y1": 83.13999999999999, "r_x2": 481.759, "r_y2": 77.48699999999997, "r_x3": 448.373, "r_y3": 77.48699999999997, "coord_origin": "TOPLEFT"}, "text": "Table Bank", "orig": "Table Bank", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 82.553, "r_y0": 146.18100000000004, "r_x1": 105.08, "r_y1": 146.18100000000004, "r_x2": 105.08, "r_y2": 141.47000000000003, "r_x3": 82.553, "r_y3": 141.47000000000003, "coord_origin": "TOPLEFT"}, "text": "Train Val", "orig": "Train Val", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 63.039, "r_y0": 106.00900000000001, "r_x1": 85.29, "r_y1": 106.00900000000001, "r_x2": 85.29, "r_y2": 101.298, "r_x3": 63.039, "r_y3": 101.298, "coord_origin": "TOPLEFT"}, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 67.768, "r_y0": 129.29999999999995, "r_x1": 85.231, "r_y1": 129.29999999999995, "r_x2": 85.231, "r_y2": 124.58900000000006, "r_x3": 67.768, "r_y3": 124.58900000000006, "coord_origin": "TOPLEFT"}, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 227.551, "r_y0": 107.44500000000005, "r_x1": 249.803, "r_y1": 107.44500000000005, "r_x2": 249.803, "r_y2": 102.73400000000004, "r_x3": 227.551, "r_y3": 102.73400000000004, "coord_origin": "TOPLEFT"}, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 232.199, "r_y0": 131.89099999999996, "r_x1": 249.662, "r_y1": 131.89099999999996, "r_x2": 249.662, "r_y2": 127.17999999999995, "r_x3": 232.199, "r_y3": 127.17999999999995, "coord_origin": "TOPLEFT"}, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 396.234, "r_y0": 118.95000000000005, "r_x1": 413.697, "r_y1": 118.95000000000005, "r_x2": 413.697, "r_y2": 114.23900000000003, "r_x3": 396.234, "r_y3": 114.23900000000003, "coord_origin": "TOPLEFT"}, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 60.938, "r_y0": 90.63800000000003, "r_x1": 76.151, "r_y1": 90.63800000000003, "r_x2": 76.151, "r_y2": 85.92700000000002, "r_x3": 60.938, "r_y3": 85.92700000000002, "coord_origin": "TOPLEFT"}, "text": "100%", "orig": "100%", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 82.305, "r_y0": 91.12800000000004, "r_x1": 106.992, "r_y1": 91.10699999999997, "r_x2": 106.992, "r_y2": 86.39599999999996, "r_x3": 82.305, "r_y3": 86.41700000000003, "coord_origin": "TOPLEFT"}, "text": "500K 10K", "orig": "500K 10K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 246.205, "r_y0": 146.51099999999997, "r_x1": 271.386, "r_y1": 146.51099999999997, "r_x2": 271.386, "r_y2": 141.79999999999995, "r_x3": 246.205, "r_y3": 141.79999999999995, "coord_origin": "TOPLEFT"}, "text": "Train Test", "orig": "Train Test", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 274.182, "r_y0": 146.51099999999997, "r_x1": 281.88, "r_y1": 146.51099999999997, "r_x2": 281.88, "r_y2": 141.79999999999995, "r_x3": 274.182, "r_y3": 141.79999999999995, "coord_origin": "TOPLEFT"}, "text": "Val", "orig": "Val", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 226.698, "r_y0": 90.63800000000003, "r_x1": 241.912, "r_y1": 90.63800000000003, "r_x2": 241.912, "r_y2": 85.92700000000002, "r_x3": 226.698, "r_y3": 85.92700000000002, "coord_origin": "TOPLEFT"}, "text": "100%", "orig": "100%", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 249.939, "r_y0": 90.99300000000005, "r_x1": 282.494, "r_y1": 91.0, "r_x2": 282.494, "r_y2": 86.28899999999999, "r_x3": 249.939, "r_y3": 86.28200000000004, "coord_origin": "TOPLEFT"}, "text": "91K 10K10K", "orig": "91K 10K10K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 410.194, "r_y0": 146.18100000000004, "r_x1": 434.278, "r_y1": 146.32799999999997, "r_x2": 434.278, "r_y2": 141.61699999999996, "r_x3": 410.194, "r_y3": 141.47000000000003, "coord_origin": "TOPLEFT"}, "text": "Train Test", "orig": "Train Test", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 436.991, "r_y0": 146.32799999999997, "r_x1": 444.689, "r_y1": 146.32799999999997, "r_x2": 444.689, "r_y2": 141.61699999999996, "r_x3": 436.991, "r_y3": 141.61699999999996, "coord_origin": "TOPLEFT"}, "text": "Val", "orig": "Val", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 391.373, "r_y0": 90.63800000000003, "r_x1": 406.587, "r_y1": 90.63800000000003, "r_x2": 406.587, "r_y2": 85.92700000000002, "r_x3": 391.373, "r_y3": 85.92700000000002, "coord_origin": "TOPLEFT"}, "text": "100%", "orig": "100%", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 19, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 410.521, "r_y0": 91.12800000000004, "r_x1": 445.624, "r_y1": 91.16600000000005, "r_x2": 445.624, "r_y2": 86.45500000000004, "r_x3": 410.521, "r_y3": 86.41700000000003, "coord_origin": "TOPLEFT"}, "text": "130K 5K 10K", "orig": "130K 5K 10K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 20, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 113.949, "r_y0": 146.19299999999998, "r_x1": 156.042, "r_y1": 146.341, "r_x2": 156.042, "r_y2": 141.63, "r_x3": 113.949, "r_y3": 141.48199999999997, "coord_origin": "TOPLEFT"}, "text": "Complex Simple", "orig": "Complex Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 21, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 116.916, "r_y0": 99.72299999999996, "r_x1": 127.054, "r_y1": 99.72299999999996, "r_x2": 127.054, "r_y2": 95.01199999999994, "r_x3": 116.916, "r_y3": 95.01199999999994, "coord_origin": "TOPLEFT"}, "text": "Non", "orig": "Non", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 22, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 113.315, "r_y0": 105.84299999999996, "r_x1": 127.053, "r_y1": 105.84299999999996, "r_x2": 127.053, "r_y2": 101.13199999999995, "r_x3": 113.315, "r_y3": 101.13199999999995, "coord_origin": "TOPLEFT"}, "text": "Strict", "orig": "Strict", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 23, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 112.941, "r_y0": 111.96299999999997, "r_x1": 127.055, "r_y1": 111.96299999999997, "r_x2": 127.055, "r_y2": 107.25199999999995, "r_x3": 112.941, "r_y3": 107.25199999999995, "coord_origin": "TOPLEFT"}, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 24, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 113.227, "r_y0": 127.51999999999998, "r_x1": 126.966, "r_y1": 127.51999999999998, "r_x2": 126.966, "r_y2": 122.80899999999997, "r_x3": 113.227, "r_y3": 122.80899999999997, "coord_origin": "TOPLEFT"}, "text": "Strict", "orig": "Strict", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 25, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 112.854, "r_y0": 133.64, "r_x1": 126.968, "r_y1": 133.64, "r_x2": 126.968, "r_y2": 128.92899999999997, "r_x3": 112.854, "r_y3": 128.92899999999997, "coord_origin": "TOPLEFT"}, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 26, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 122.031, "r_y0": 91.17600000000004, "r_x1": 151.042, "r_y1": 91.17100000000005, "r_x2": 151.042, "r_y2": 86.46000000000004, "r_x3": 122.031, "r_y3": 86.46500000000003, "coord_origin": "TOPLEFT"}, "text": "230K 280K", "orig": "230K 280K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 27, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 311.654, "r_y0": 91.46000000000004, "r_x1": 321.672, "r_y1": 91.46000000000004, "r_x2": 321.672, "r_y2": 86.74900000000002, "r_x3": 311.654, "r_y3": 86.74900000000002, "coord_origin": "TOPLEFT"}, "text": "65K", "orig": "65K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 28, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 287.894, "r_y0": 146.615, "r_x1": 328.809, "r_y1": 146.615, "r_x2": 328.809, "r_y2": 141.904, "r_x3": 287.894, "r_y3": 141.904, "coord_origin": "TOPLEFT"}, "text": "Complex Simple", "orig": "Complex Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 29, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 289.236, "r_y0": 97.98500000000001, "r_x1": 299.375, "r_y1": 97.98500000000001, "r_x2": 299.375, "r_y2": 93.274, "r_x3": 289.236, "r_y3": 93.274, "coord_origin": "TOPLEFT"}, "text": "Non", "orig": "Non", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 30, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 285.635, "r_y0": 104.10500000000002, "r_x1": 299.373, "r_y1": 104.10500000000002, "r_x2": 299.373, "r_y2": 99.394, "r_x3": 285.635, "r_y3": 99.394, "coord_origin": "TOPLEFT"}, "text": "Strict", "orig": "Strict", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 285.261, "r_y0": 110.22500000000002, "r_x1": 299.375, "r_y1": 110.22500000000002, "r_x2": 299.375, "r_y2": 105.51400000000001, "r_x3": 285.261, "r_y3": 105.51400000000001, "coord_origin": "TOPLEFT"}, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 285.431, "r_y0": 125.29499999999996, "r_x1": 299.169, "r_y1": 125.29499999999996, "r_x2": 299.169, "r_y2": 120.58399999999995, "r_x3": 285.431, "r_y3": 120.58399999999995, "coord_origin": "TOPLEFT"}, "text": "Strict", "orig": "Strict", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 285.057, "r_y0": 131.41499999999996, "r_x1": 299.171, "r_y1": 131.41499999999996, "r_x2": 299.171, "r_y2": 126.70399999999995, "r_x3": 285.057, "r_y3": 126.70399999999995, "coord_origin": "TOPLEFT"}, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 299.584, "r_y0": 91.59799999999996, "r_x1": 309.602, "r_y1": 91.59799999999996, "r_x2": 309.602, "r_y2": 86.88699999999994, "r_x3": 299.584, "r_y3": 86.88699999999994, "coord_origin": "TOPLEFT"}, "text": "47K", "orig": "47K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 466.041, "r_y0": 146.57600000000002, "r_x1": 483.504, "r_y1": 146.57600000000002, "r_x2": 483.504, "r_y2": 141.86599999999999, "r_x3": 466.041, "r_y3": 141.86599999999999, "coord_origin": "TOPLEFT"}, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 459.022, "r_y0": 98.66600000000005, "r_x1": 469.16, "r_y1": 98.66600000000005, "r_x2": 469.16, "r_y2": 93.95500000000004, "r_x3": 459.022, "r_y3": 93.95500000000004, "coord_origin": "TOPLEFT"}, "text": "Non", "orig": "Non", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 455.421, "r_y0": 104.78599999999994, "r_x1": 469.159, "r_y1": 104.78599999999994, "r_x2": 469.159, "r_y2": 100.07500000000005, "r_x3": 455.421, "r_y3": 100.07500000000005, "coord_origin": "TOPLEFT"}, "text": "Strict", "orig": "Strict", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 455.047, "r_y0": 110.90599999999995, "r_x1": 469.161, "r_y1": 110.90599999999995, "r_x2": 469.161, "r_y2": 106.19500000000005, "r_x3": 455.047, "r_y3": 106.19500000000005, "coord_origin": "TOPLEFT"}, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 467.394, "r_y0": 90.47699999999998, "r_x1": 480.655, "r_y1": 90.47699999999998, "r_x2": 480.655, "r_y2": 85.76599999999996, "r_x3": 467.394, "r_y3": 85.76599999999996, "coord_origin": "TOPLEFT"}, "text": "145K", "orig": "145K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.377, "r_y0": 146.48900000000003, "r_x1": 202.841, "r_y1": 146.61599999999999, "r_x2": 202.841, "r_y2": 141.90499999999997, "r_x3": 160.377, "r_y3": 141.77800000000002, "coord_origin": "TOPLEFT"}, "text": "Complex Simple", "orig": "Complex Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 153.743, "r_y0": 99.76999999999998, "r_x1": 173.327, "r_y1": 99.76999999999998, "r_x2": 173.327, "r_y2": 95.05899999999997, "r_x3": 153.743, "r_y3": 95.05899999999997, "coord_origin": "TOPLEFT"}, "text": "Contain", "orig": "Contain", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 154.51, "r_y0": 105.88999999999999, "r_x1": 173.325, "r_y1": 105.88999999999999, "r_x2": 173.325, "r_y2": 101.17899999999997, "r_x3": 154.51, "r_y3": 101.17899999999997, "coord_origin": "TOPLEFT"}, "text": "Missing", "orig": "Missing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 155.272, "r_y0": 112.00999999999999, "r_x1": 173.327, "r_y1": 112.00999999999999, "r_x2": 173.327, "r_y2": 107.29899999999998, "r_x3": 155.272, "r_y3": 107.29899999999998, "coord_origin": "TOPLEFT"}, "text": "bboxes", "orig": "bboxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 326.413, "r_y0": 112.13699999999994, "r_x1": 345.997, "r_y1": 112.13699999999994, "r_x2": 345.997, "r_y2": 107.42600000000004, "r_x3": 326.413, "r_y3": 107.42600000000004, "coord_origin": "TOPLEFT"}, "text": "Contain", "orig": "Contain", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 327.18, "r_y0": 118.25699999999995, "r_x1": 345.995, "r_y1": 118.25699999999995, "r_x2": 345.995, "r_y2": 113.54600000000005, "r_x3": 327.18, "r_y3": 113.54600000000005, "coord_origin": "TOPLEFT"}, "text": "Missing", "orig": "Missing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 327.941, "r_y0": 124.37699999999995, "r_x1": 345.996, "r_y1": 124.37699999999995, "r_x2": 345.996, "r_y2": 119.66600000000005, "r_x3": 327.941, "r_y3": 119.66600000000005, "coord_origin": "TOPLEFT"}, "text": "bboxes", "orig": "bboxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 488.994, "r_y0": 109.05899999999997, "r_x1": 508.764, "r_y1": 109.05899999999997, "r_x2": 508.764, "r_y2": 104.34799999999996, "r_x3": 488.994, "r_y3": 104.34799999999996, "coord_origin": "TOPLEFT"}, "text": "Dataset", "orig": "Dataset", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 48, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 490.189, "r_y0": 115.17899999999997, "r_x1": 508.764, "r_y1": 115.17899999999997, "r_x2": 508.764, "r_y2": 110.46799999999996, "r_x3": 490.189, "r_y3": 110.46799999999996, "coord_origin": "TOPLEFT"}, "text": "doesn't", "orig": "doesn't", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 49, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 489.72, "r_y0": 121.29899999999998, "r_x1": 508.768, "r_y1": 121.29899999999998, "r_x2": 508.768, "r_y2": 116.58799999999997, "r_x3": 489.72, "r_y3": 116.58799999999997, "coord_origin": "TOPLEFT"}, "text": "provide", "orig": "provide", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 50, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 490.711, "r_y0": 127.41899999999998, "r_x1": 508.766, "r_y1": 127.41899999999998, "r_x2": 508.766, "r_y2": 122.70799999999997, "r_x3": 490.711, "r_y3": 122.70799999999997, "coord_origin": "TOPLEFT"}, "text": "bboxes", "orig": "bboxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 51, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 168.504, "r_y0": 91.04100000000005, "r_x1": 197.527, "r_y1": 91.0, "r_x2": 197.527, "r_y2": 86.28899999999999, "r_x3": 168.504, "r_y3": 86.33000000000004, "coord_origin": "TOPLEFT"}, "text": "230K 280K", "orig": "230K 280K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 52, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 357.377, "r_y0": 90.90200000000004, "r_x1": 367.395, "r_y1": 90.90200000000004, "r_x2": 367.395, "r_y2": 86.19100000000003, "r_x3": 357.377, "r_y3": 86.19100000000003, "coord_origin": "TOPLEFT"}, "text": "65K", "orig": "65K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 53, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 333.732, "r_y0": 146.52800000000002, "r_x1": 374.929, "r_y1": 146.52800000000002, "r_x2": 374.929, "r_y2": 141.817, "r_x3": 333.732, "r_y3": 141.817, "coord_origin": "TOPLEFT"}, "text": "Complex Simple", "orig": "Complex Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 54, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 345.691, "r_y0": 90.96100000000001, "r_x1": 355.709, "r_y1": 90.96100000000001, "r_x2": 355.709, "r_y2": 86.25, "r_x3": 345.691, "r_y3": 86.25, "coord_origin": "TOPLEFT"}, "text": "47K", "orig": "47K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 55, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 508.543, "r_y0": 146.28200000000004, "r_x1": 526.006, "r_y1": 146.28200000000004, "r_x2": 526.006, "r_y2": 141.57100000000003, "r_x3": 508.543, "r_y3": 141.57100000000003, "coord_origin": "TOPLEFT"}, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 56, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 510.447, "r_y0": 90.99699999999996, "r_x1": 523.707, "r_y1": 90.99699999999996, "r_x2": 523.707, "r_y2": 86.28599999999994, "r_x3": 510.447, "r_y3": 86.28599999999994, "coord_origin": "TOPLEFT"}, "text": "145K", "orig": "145K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": [{"id": 46, "label": "text", "bbox": {"l": 119.391, "t": 77.543, "r": 151.946, "b": 83.19600000000003, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 0, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 119.391, "r_y0": 83.19600000000003, "r_x1": 151.946, "r_y1": 83.19600000000003, "r_x2": 151.946, "r_y2": 77.543, "r_x3": 119.391, "r_y3": 77.543, "coord_origin": "TOPLEFT"}, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 47, "label": "text", "bbox": {"l": 53.346, "t": 75.42399999999998, "r": 59.327, "b": 81.077, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 53.346, "r_y0": 81.077, "r_x1": 59.327, "r_y1": 81.077, "r_x2": 59.327, "r_y2": 75.42399999999998, "r_x3": 53.346, "r_y3": 75.42399999999998, "coord_origin": "TOPLEFT"}, "text": "b.", "orig": "b.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 48, "label": "text", "bbox": {"l": 289.579, "t": 77.69100000000003, "r": 319.827, "b": 83.34400000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 289.579, "r_y0": 83.34400000000005, "r_x1": 319.827, "r_y1": 83.34400000000005, "r_x2": 319.827, "r_y2": 77.69100000000003, "r_x3": 289.579, "r_y3": 77.69100000000003, "coord_origin": "TOPLEFT"}, "text": "FinTabNet", "orig": "FinTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 49, "label": "text", "bbox": {"l": 448.373, "t": 77.48699999999997, "r": 481.759, "b": 83.13999999999999, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 448.373, "r_y0": 83.13999999999999, "r_x1": 481.759, "r_y1": 83.13999999999999, "r_x2": 481.759, "r_y2": 77.48699999999997, "r_x3": 448.373, "r_y3": 77.48699999999997, "coord_origin": "TOPLEFT"}, "text": "Table Bank", "orig": "Table Bank", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 50, "label": "text", "bbox": {"l": 82.553, "t": 141.47000000000003, "r": 105.08, "b": 146.18100000000004, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 82.553, "r_y0": 146.18100000000004, "r_x1": 105.08, "r_y1": 146.18100000000004, "r_x2": 105.08, "r_y2": 141.47000000000003, "r_x3": 82.553, "r_y3": 141.47000000000003, "coord_origin": "TOPLEFT"}, "text": "Train Val", "orig": "Train Val", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 51, "label": "text", "bbox": {"l": 63.039, "t": 101.298, "r": 85.29, "b": 106.00900000000001, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 63.039, "r_y0": 106.00900000000001, "r_x1": 85.29, "r_y1": 106.00900000000001, "r_x2": 85.29, "r_y2": 101.298, "r_x3": 63.039, "r_y3": 101.298, "coord_origin": "TOPLEFT"}, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 52, "label": "text", "bbox": {"l": 67.768, "t": 124.58900000000006, "r": 85.231, "b": 129.29999999999995, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 67.768, "r_y0": 129.29999999999995, "r_x1": 85.231, "r_y1": 129.29999999999995, "r_x2": 85.231, "r_y2": 124.58900000000006, "r_x3": 67.768, "r_y3": 124.58900000000006, "coord_origin": "TOPLEFT"}, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 53, "label": "text", "bbox": {"l": 227.551, "t": 102.73400000000004, "r": 249.803, "b": 107.44500000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 227.551, "r_y0": 107.44500000000005, "r_x1": 249.803, "r_y1": 107.44500000000005, "r_x2": 249.803, "r_y2": 102.73400000000004, "r_x3": 227.551, "r_y3": 102.73400000000004, "coord_origin": "TOPLEFT"}, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 54, "label": "text", "bbox": {"l": 232.199, "t": 127.17999999999995, "r": 249.662, "b": 131.89099999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 232.199, "r_y0": 131.89099999999996, "r_x1": 249.662, "r_y1": 131.89099999999996, "r_x2": 249.662, "r_y2": 127.17999999999995, "r_x3": 232.199, "r_y3": 127.17999999999995, "coord_origin": "TOPLEFT"}, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 55, "label": "text", "bbox": {"l": 396.234, "t": 114.23900000000003, "r": 413.697, "b": 118.95000000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 396.234, "r_y0": 118.95000000000005, "r_x1": 413.697, "r_y1": 118.95000000000005, "r_x2": 413.697, "r_y2": 114.23900000000003, "r_x3": 396.234, "r_y3": 114.23900000000003, "coord_origin": "TOPLEFT"}, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 56, "label": "text", "bbox": {"l": 60.938, "t": 85.92700000000002, "r": 76.151, "b": 90.63800000000003, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 60.938, "r_y0": 90.63800000000003, "r_x1": 76.151, "r_y1": 90.63800000000003, "r_x2": 76.151, "r_y2": 85.92700000000002, "r_x3": 60.938, "r_y3": 85.92700000000002, "coord_origin": "TOPLEFT"}, "text": "100%", "orig": "100%", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 57, "label": "text", "bbox": {"l": 82.305, "t": 86.39599999999996, "r": 106.992, "b": 91.12800000000004, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 82.305, "r_y0": 91.12800000000004, "r_x1": 106.992, "r_y1": 91.10699999999997, "r_x2": 106.992, "r_y2": 86.39599999999996, "r_x3": 82.305, "r_y3": 86.41700000000003, "coord_origin": "TOPLEFT"}, "text": "500K 10K", "orig": "500K 10K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 58, "label": "text", "bbox": {"l": 246.205, "t": 141.79999999999995, "r": 271.386, "b": 146.51099999999997, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 246.205, "r_y0": 146.51099999999997, "r_x1": 271.386, "r_y1": 146.51099999999997, "r_x2": 271.386, "r_y2": 141.79999999999995, "r_x3": 246.205, "r_y3": 141.79999999999995, "coord_origin": "TOPLEFT"}, "text": "Train Test", "orig": "Train Test", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 59, "label": "text", "bbox": {"l": 274.182, "t": 141.79999999999995, "r": 281.88, "b": 146.51099999999997, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 274.182, "r_y0": 146.51099999999997, "r_x1": 281.88, "r_y1": 146.51099999999997, "r_x2": 281.88, "r_y2": 141.79999999999995, "r_x3": 274.182, "r_y3": 141.79999999999995, "coord_origin": "TOPLEFT"}, "text": "Val", "orig": "Val", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 60, "label": "text", "bbox": {"l": 226.698, "t": 85.92700000000002, "r": 241.912, "b": 90.63800000000003, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 226.698, "r_y0": 90.63800000000003, "r_x1": 241.912, "r_y1": 90.63800000000003, "r_x2": 241.912, "r_y2": 85.92700000000002, "r_x3": 226.698, "r_y3": 85.92700000000002, "coord_origin": "TOPLEFT"}, "text": "100%", "orig": "100%", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 61, "label": "text", "bbox": {"l": 249.939, "t": 86.28200000000004, "r": 282.494, "b": 91.0, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 249.939, "r_y0": 90.99300000000005, "r_x1": 282.494, "r_y1": 91.0, "r_x2": 282.494, "r_y2": 86.28899999999999, "r_x3": 249.939, "r_y3": 86.28200000000004, "coord_origin": "TOPLEFT"}, "text": "91K 10K10K", "orig": "91K 10K10K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 62, "label": "text", "bbox": {"l": 410.194, "t": 141.47000000000003, "r": 434.278, "b": 146.32799999999997, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 410.194, "r_y0": 146.18100000000004, "r_x1": 434.278, "r_y1": 146.32799999999997, "r_x2": 434.278, "r_y2": 141.61699999999996, "r_x3": 410.194, "r_y3": 141.47000000000003, "coord_origin": "TOPLEFT"}, "text": "Train Test", "orig": "Train Test", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 63, "label": "text", "bbox": {"l": 436.991, "t": 141.61699999999996, "r": 444.689, "b": 146.32799999999997, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 436.991, "r_y0": 146.32799999999997, "r_x1": 444.689, "r_y1": 146.32799999999997, "r_x2": 444.689, "r_y2": 141.61699999999996, "r_x3": 436.991, "r_y3": 141.61699999999996, "coord_origin": "TOPLEFT"}, "text": "Val", "orig": "Val", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 64, "label": "text", "bbox": {"l": 391.373, "t": 85.92700000000002, "r": 406.587, "b": 90.63800000000003, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 391.373, "r_y0": 90.63800000000003, "r_x1": 406.587, "r_y1": 90.63800000000003, "r_x2": 406.587, "r_y2": 85.92700000000002, "r_x3": 391.373, "r_y3": 85.92700000000002, "coord_origin": "TOPLEFT"}, "text": "100%", "orig": "100%", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 65, "label": "text", "bbox": {"l": 410.521, "t": 86.41700000000003, "r": 445.624, "b": 91.16600000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 19, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 410.521, "r_y0": 91.12800000000004, "r_x1": 445.624, "r_y1": 91.16600000000005, "r_x2": 445.624, "r_y2": 86.45500000000004, "r_x3": 410.521, "r_y3": 86.41700000000003, "coord_origin": "TOPLEFT"}, "text": "130K 5K 10K", "orig": "130K 5K 10K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 66, "label": "text", "bbox": {"l": 113.949, "t": 141.48199999999997, "r": 156.042, "b": 146.341, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 20, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 113.949, "r_y0": 146.19299999999998, "r_x1": 156.042, "r_y1": 146.341, "r_x2": 156.042, "r_y2": 141.63, "r_x3": 113.949, "r_y3": 141.48199999999997, "coord_origin": "TOPLEFT"}, "text": "Complex Simple", "orig": "Complex Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 67, "label": "text", "bbox": {"l": 116.916, "t": 95.01199999999994, "r": 127.054, "b": 99.72299999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 21, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 116.916, "r_y0": 99.72299999999996, "r_x1": 127.054, "r_y1": 99.72299999999996, "r_x2": 127.054, "r_y2": 95.01199999999994, "r_x3": 116.916, "r_y3": 95.01199999999994, "coord_origin": "TOPLEFT"}, "text": "Non", "orig": "Non", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 68, "label": "text", "bbox": {"l": 113.315, "t": 101.13199999999995, "r": 127.053, "b": 105.84299999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 22, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 113.315, "r_y0": 105.84299999999996, "r_x1": 127.053, "r_y1": 105.84299999999996, "r_x2": 127.053, "r_y2": 101.13199999999995, "r_x3": 113.315, "r_y3": 101.13199999999995, "coord_origin": "TOPLEFT"}, "text": "Strict", "orig": "Strict", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 69, "label": "text", "bbox": {"l": 112.941, "t": 107.25199999999995, "r": 127.055, "b": 111.96299999999997, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 23, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 112.941, "r_y0": 111.96299999999997, "r_x1": 127.055, "r_y1": 111.96299999999997, "r_x2": 127.055, "r_y2": 107.25199999999995, "r_x3": 112.941, "r_y3": 107.25199999999995, "coord_origin": "TOPLEFT"}, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 70, "label": "text", "bbox": {"l": 113.227, "t": 122.80899999999997, "r": 126.966, "b": 127.51999999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 24, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 113.227, "r_y0": 127.51999999999998, "r_x1": 126.966, "r_y1": 127.51999999999998, "r_x2": 126.966, "r_y2": 122.80899999999997, "r_x3": 113.227, "r_y3": 122.80899999999997, "coord_origin": "TOPLEFT"}, "text": "Strict", "orig": "Strict", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 71, "label": "text", "bbox": {"l": 112.854, "t": 128.92899999999997, "r": 126.968, "b": 133.64, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 25, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 112.854, "r_y0": 133.64, "r_x1": 126.968, "r_y1": 133.64, "r_x2": 126.968, "r_y2": 128.92899999999997, "r_x3": 112.854, "r_y3": 128.92899999999997, "coord_origin": "TOPLEFT"}, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 72, "label": "text", "bbox": {"l": 122.031, "t": 86.46000000000004, "r": 151.042, "b": 91.17600000000004, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 26, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 122.031, "r_y0": 91.17600000000004, "r_x1": 151.042, "r_y1": 91.17100000000005, "r_x2": 151.042, "r_y2": 86.46000000000004, "r_x3": 122.031, "r_y3": 86.46500000000003, "coord_origin": "TOPLEFT"}, "text": "230K 280K", "orig": "230K 280K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 73, "label": "text", "bbox": {"l": 311.654, "t": 86.74900000000002, "r": 321.672, "b": 91.46000000000004, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 27, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 311.654, "r_y0": 91.46000000000004, "r_x1": 321.672, "r_y1": 91.46000000000004, "r_x2": 321.672, "r_y2": 86.74900000000002, "r_x3": 311.654, "r_y3": 86.74900000000002, "coord_origin": "TOPLEFT"}, "text": "65K", "orig": "65K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 74, "label": "text", "bbox": {"l": 287.894, "t": 141.904, "r": 328.809, "b": 146.615, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 28, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 287.894, "r_y0": 146.615, "r_x1": 328.809, "r_y1": 146.615, "r_x2": 328.809, "r_y2": 141.904, "r_x3": 287.894, "r_y3": 141.904, "coord_origin": "TOPLEFT"}, "text": "Complex Simple", "orig": "Complex Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 75, "label": "text", "bbox": {"l": 289.236, "t": 93.274, "r": 299.375, "b": 97.98500000000001, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 29, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 289.236, "r_y0": 97.98500000000001, "r_x1": 299.375, "r_y1": 97.98500000000001, "r_x2": 299.375, "r_y2": 93.274, "r_x3": 289.236, "r_y3": 93.274, "coord_origin": "TOPLEFT"}, "text": "Non", "orig": "Non", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 76, "label": "text", "bbox": {"l": 285.635, "t": 99.394, "r": 299.373, "b": 104.10500000000002, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 30, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 285.635, "r_y0": 104.10500000000002, "r_x1": 299.373, "r_y1": 104.10500000000002, "r_x2": 299.373, "r_y2": 99.394, "r_x3": 285.635, "r_y3": 99.394, "coord_origin": "TOPLEFT"}, "text": "Strict", "orig": "Strict", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 77, "label": "text", "bbox": {"l": 285.261, "t": 105.51400000000001, "r": 299.375, "b": 110.22500000000002, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 285.261, "r_y0": 110.22500000000002, "r_x1": 299.375, "r_y1": 110.22500000000002, "r_x2": 299.375, "r_y2": 105.51400000000001, "r_x3": 285.261, "r_y3": 105.51400000000001, "coord_origin": "TOPLEFT"}, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 78, "label": "text", "bbox": {"l": 285.431, "t": 120.58399999999995, "r": 299.169, "b": 125.29499999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 285.431, "r_y0": 125.29499999999996, "r_x1": 299.169, "r_y1": 125.29499999999996, "r_x2": 299.169, "r_y2": 120.58399999999995, "r_x3": 285.431, "r_y3": 120.58399999999995, "coord_origin": "TOPLEFT"}, "text": "Strict", "orig": "Strict", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 79, "label": "text", "bbox": {"l": 285.057, "t": 126.70399999999995, "r": 299.171, "b": 131.41499999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 285.057, "r_y0": 131.41499999999996, "r_x1": 299.171, "r_y1": 131.41499999999996, "r_x2": 299.171, "r_y2": 126.70399999999995, "r_x3": 285.057, "r_y3": 126.70399999999995, "coord_origin": "TOPLEFT"}, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 80, "label": "text", "bbox": {"l": 299.584, "t": 86.88699999999994, "r": 309.602, "b": 91.59799999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 299.584, "r_y0": 91.59799999999996, "r_x1": 309.602, "r_y1": 91.59799999999996, "r_x2": 309.602, "r_y2": 86.88699999999994, "r_x3": 299.584, "r_y3": 86.88699999999994, "coord_origin": "TOPLEFT"}, "text": "47K", "orig": "47K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 81, "label": "text", "bbox": {"l": 466.041, "t": 141.86599999999999, "r": 483.504, "b": 146.57600000000002, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 466.041, "r_y0": 146.57600000000002, "r_x1": 483.504, "r_y1": 146.57600000000002, "r_x2": 483.504, "r_y2": 141.86599999999999, "r_x3": 466.041, "r_y3": 141.86599999999999, "coord_origin": "TOPLEFT"}, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 82, "label": "text", "bbox": {"l": 459.022, "t": 93.95500000000004, "r": 469.16, "b": 98.66600000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 459.022, "r_y0": 98.66600000000005, "r_x1": 469.16, "r_y1": 98.66600000000005, "r_x2": 469.16, "r_y2": 93.95500000000004, "r_x3": 459.022, "r_y3": 93.95500000000004, "coord_origin": "TOPLEFT"}, "text": "Non", "orig": "Non", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 83, "label": "text", "bbox": {"l": 455.421, "t": 100.07500000000005, "r": 469.159, "b": 104.78599999999994, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 455.421, "r_y0": 104.78599999999994, "r_x1": 469.159, "r_y1": 104.78599999999994, "r_x2": 469.159, "r_y2": 100.07500000000005, "r_x3": 455.421, "r_y3": 100.07500000000005, "coord_origin": "TOPLEFT"}, "text": "Strict", "orig": "Strict", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 84, "label": "text", "bbox": {"l": 455.047, "t": 106.19500000000005, "r": 469.161, "b": 110.90599999999995, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 455.047, "r_y0": 110.90599999999995, "r_x1": 469.161, "r_y1": 110.90599999999995, "r_x2": 469.161, "r_y2": 106.19500000000005, "r_x3": 455.047, "r_y3": 106.19500000000005, "coord_origin": "TOPLEFT"}, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 85, "label": "text", "bbox": {"l": 467.394, "t": 85.76599999999996, "r": 480.655, "b": 90.47699999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 467.394, "r_y0": 90.47699999999998, "r_x1": 480.655, "r_y1": 90.47699999999998, "r_x2": 480.655, "r_y2": 85.76599999999996, "r_x3": 467.394, "r_y3": 85.76599999999996, "coord_origin": "TOPLEFT"}, "text": "145K", "orig": "145K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 86, "label": "text", "bbox": {"l": 160.377, "t": 141.77800000000002, "r": 202.841, "b": 146.61599999999999, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.377, "r_y0": 146.48900000000003, "r_x1": 202.841, "r_y1": 146.61599999999999, "r_x2": 202.841, "r_y2": 141.90499999999997, "r_x3": 160.377, "r_y3": 141.77800000000002, "coord_origin": "TOPLEFT"}, "text": "Complex Simple", "orig": "Complex Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 87, "label": "text", "bbox": {"l": 153.743, "t": 95.05899999999997, "r": 173.327, "b": 99.76999999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 153.743, "r_y0": 99.76999999999998, "r_x1": 173.327, "r_y1": 99.76999999999998, "r_x2": 173.327, "r_y2": 95.05899999999997, "r_x3": 153.743, "r_y3": 95.05899999999997, "coord_origin": "TOPLEFT"}, "text": "Contain", "orig": "Contain", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 88, "label": "text", "bbox": {"l": 154.51, "t": 101.17899999999997, "r": 173.325, "b": 105.88999999999999, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 154.51, "r_y0": 105.88999999999999, "r_x1": 173.325, "r_y1": 105.88999999999999, "r_x2": 173.325, "r_y2": 101.17899999999997, "r_x3": 154.51, "r_y3": 101.17899999999997, "coord_origin": "TOPLEFT"}, "text": "Missing", "orig": "Missing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 89, "label": "text", "bbox": {"l": 155.272, "t": 107.29899999999998, "r": 173.327, "b": 112.00999999999999, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 155.272, "r_y0": 112.00999999999999, "r_x1": 173.327, "r_y1": 112.00999999999999, "r_x2": 173.327, "r_y2": 107.29899999999998, "r_x3": 155.272, "r_y3": 107.29899999999998, "coord_origin": "TOPLEFT"}, "text": "bboxes", "orig": "bboxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 90, "label": "text", "bbox": {"l": 326.413, "t": 107.42600000000004, "r": 345.997, "b": 112.13699999999994, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 326.413, "r_y0": 112.13699999999994, "r_x1": 345.997, "r_y1": 112.13699999999994, "r_x2": 345.997, "r_y2": 107.42600000000004, "r_x3": 326.413, "r_y3": 107.42600000000004, "coord_origin": "TOPLEFT"}, "text": "Contain", "orig": "Contain", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 91, "label": "text", "bbox": {"l": 327.18, "t": 113.54600000000005, "r": 345.995, "b": 118.25699999999995, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 327.18, "r_y0": 118.25699999999995, "r_x1": 345.995, "r_y1": 118.25699999999995, "r_x2": 345.995, "r_y2": 113.54600000000005, "r_x3": 327.18, "r_y3": 113.54600000000005, "coord_origin": "TOPLEFT"}, "text": "Missing", "orig": "Missing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 92, "label": "text", "bbox": {"l": 327.941, "t": 119.66600000000005, "r": 345.996, "b": 124.37699999999995, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 327.941, "r_y0": 124.37699999999995, "r_x1": 345.996, "r_y1": 124.37699999999995, "r_x2": 345.996, "r_y2": 119.66600000000005, "r_x3": 327.941, "r_y3": 119.66600000000005, "coord_origin": "TOPLEFT"}, "text": "bboxes", "orig": "bboxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 93, "label": "text", "bbox": {"l": 488.994, "t": 104.34799999999996, "r": 508.764, "b": 109.05899999999997, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 488.994, "r_y0": 109.05899999999997, "r_x1": 508.764, "r_y1": 109.05899999999997, "r_x2": 508.764, "r_y2": 104.34799999999996, "r_x3": 488.994, "r_y3": 104.34799999999996, "coord_origin": "TOPLEFT"}, "text": "Dataset", "orig": "Dataset", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 94, "label": "text", "bbox": {"l": 490.189, "t": 110.46799999999996, "r": 508.764, "b": 115.17899999999997, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 48, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 490.189, "r_y0": 115.17899999999997, "r_x1": 508.764, "r_y1": 115.17899999999997, "r_x2": 508.764, "r_y2": 110.46799999999996, "r_x3": 490.189, "r_y3": 110.46799999999996, "coord_origin": "TOPLEFT"}, "text": "doesn't", "orig": "doesn't", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 95, "label": "text", "bbox": {"l": 489.72, "t": 116.58799999999997, "r": 508.768, "b": 121.29899999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 49, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 489.72, "r_y0": 121.29899999999998, "r_x1": 508.768, "r_y1": 121.29899999999998, "r_x2": 508.768, "r_y2": 116.58799999999997, "r_x3": 489.72, "r_y3": 116.58799999999997, "coord_origin": "TOPLEFT"}, "text": "provide", "orig": "provide", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 96, "label": "text", "bbox": {"l": 490.711, "t": 122.70799999999997, "r": 508.766, "b": 127.41899999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 50, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 490.711, "r_y0": 127.41899999999998, "r_x1": 508.766, "r_y1": 127.41899999999998, "r_x2": 508.766, "r_y2": 122.70799999999997, "r_x3": 490.711, "r_y3": 122.70799999999997, "coord_origin": "TOPLEFT"}, "text": "bboxes", "orig": "bboxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 97, "label": "text", "bbox": {"l": 168.504, "t": 86.28899999999999, "r": 197.527, "b": 91.04100000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 51, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 168.504, "r_y0": 91.04100000000005, "r_x1": 197.527, "r_y1": 91.0, "r_x2": 197.527, "r_y2": 86.28899999999999, "r_x3": 168.504, "r_y3": 86.33000000000004, "coord_origin": "TOPLEFT"}, "text": "230K 280K", "orig": "230K 280K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 98, "label": "text", "bbox": {"l": 357.377, "t": 86.19100000000003, "r": 367.395, "b": 90.90200000000004, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 52, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 357.377, "r_y0": 90.90200000000004, "r_x1": 367.395, "r_y1": 90.90200000000004, "r_x2": 367.395, "r_y2": 86.19100000000003, "r_x3": 357.377, "r_y3": 86.19100000000003, "coord_origin": "TOPLEFT"}, "text": "65K", "orig": "65K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 99, "label": "text", "bbox": {"l": 333.732, "t": 141.817, "r": 374.929, "b": 146.52800000000002, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 53, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 333.732, "r_y0": 146.52800000000002, "r_x1": 374.929, "r_y1": 146.52800000000002, "r_x2": 374.929, "r_y2": 141.817, "r_x3": 333.732, "r_y3": 141.817, "coord_origin": "TOPLEFT"}, "text": "Complex Simple", "orig": "Complex Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 100, "label": "text", "bbox": {"l": 345.691, "t": 86.25, "r": 355.709, "b": 90.96100000000001, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 54, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 345.691, "r_y0": 90.96100000000001, "r_x1": 355.709, "r_y1": 90.96100000000001, "r_x2": 355.709, "r_y2": 86.25, "r_x3": 345.691, "r_y3": 86.25, "coord_origin": "TOPLEFT"}, "text": "47K", "orig": "47K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 101, "label": "text", "bbox": {"l": 508.543, "t": 141.57100000000003, "r": 526.006, "b": 146.28200000000004, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 55, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 508.543, "r_y0": 146.28200000000004, "r_x1": 526.006, "r_y1": 146.28200000000004, "r_x2": 526.006, "r_y2": 141.57100000000003, "r_x3": 508.543, "r_y3": 141.57100000000003, "coord_origin": "TOPLEFT"}, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 102, "label": "text", "bbox": {"l": 510.447, "t": 86.28599999999994, "r": 523.707, "b": 90.99699999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 56, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 510.447, "r_y0": 90.99699999999996, "r_x1": 523.707, "r_y1": 90.99699999999996, "r_x2": 523.707, "r_y2": 86.28599999999994, "r_x3": 510.447, "r_y3": 86.28599999999994, "coord_origin": "TOPLEFT"}, "text": "145K", "orig": "145K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}]}, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null}, {"label": "caption", "id": 1, "page_no": 11, "cluster": {"id": 1, "label": "caption", "bbox": {"l": 50.112, "t": 165.77099999999996, "r": 545.114, "b": 186.27800000000002, "coord_origin": "TOPLEFT"}, "confidence": 0.9661495685577393, "cells": [{"index": 57, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 174.32299999999998, "r_x1": 86.585, "r_y1": 174.32299999999998, "r_x2": 86.585, "r_y2": 165.77099999999996, "r_x3": 50.112, "r_y3": 165.77099999999996, "coord_origin": "TOPLEFT"}, "text": "Figure 7:", "orig": "Figure 7:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 58, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 92.832, "r_y0": 174.32299999999998, "r_x1": 545.114, "r_y1": 174.32299999999998, "r_x2": 545.114, "r_y2": 165.77099999999996, "r_x3": 92.832, "r_y3": 165.77099999999996, "coord_origin": "TOPLEFT"}, "text": "Distribution of the tables across different dimensions per dataset. Simple vs complex tables per dataset and split,", "orig": "Distribution of the tables across different dimensions per dataset. Simple vs complex tables per dataset and split,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 59, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 186.27800000000002, "r_x1": 513.522, "r_y1": 186.27800000000002, "r_x2": 513.522, "r_y2": 177.726, "r_x3": 50.112, "r_y3": 177.726, "coord_origin": "TOPLEFT"}, "text": "strict vs non strict html structures per dataset and table complexity, missing bboxes per dataset and table complexity.", "orig": "strict vs non strict html structures per dataset and table complexity, missing bboxes per dataset and table complexity.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Figure 7: Distribution of the tables across different dimensions per dataset. Simple vs complex tables per dataset and split, strict vs non strict html structures per dataset and table complexity, missing bboxes per dataset and table complexity."}, {"label": "list_item", "id": 4, "page_no": 11, "cluster": {"id": 4, "label": "list_item", "bbox": {"l": 61.569, "t": 211.20000000000005, "r": 286.365, "b": 231.707, "coord_origin": "TOPLEFT"}, "confidence": 0.9621952772140503, "cells": [{"index": 60, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 61.569, "r_y0": 219.75199999999995, "r_x1": 65.056, "r_y1": 219.75199999999995, "r_x2": 65.056, "r_y2": 211.20000000000005, "r_x3": 61.569, "r_y3": 211.20000000000005, "coord_origin": "TOPLEFT"}, "text": "\u2022", "orig": "\u2022", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 61, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.037, "r_y0": 219.75199999999995, "r_x1": 286.365, "r_y1": 219.75199999999995, "r_x2": 286.365, "r_y2": 211.20000000000005, "r_x3": 70.037, "r_y3": 211.20000000000005, "coord_origin": "TOPLEFT"}, "text": "TableFormer output does not include the table cell con-", "orig": "TableFormer output does not include the table cell con-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 62, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.037, "r_y0": 231.707, "r_x1": 87.472, "r_y1": 231.707, "r_x2": 87.472, "r_y2": 223.15499999999997, "r_x3": 70.037, "r_y3": 223.15499999999997, "coord_origin": "TOPLEFT"}, "text": "tent.", "orig": "tent.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "\u00b7 TableFormer output does not include the table cell content."}, {"label": "list_item", "id": 3, "page_no": 11, "cluster": {"id": 3, "label": "list_item", "bbox": {"l": 61.569, "t": 244.34000000000003, "r": 286.365, "b": 264.847, "coord_origin": "TOPLEFT"}, "confidence": 0.9629555344581604, "cells": [{"index": 63, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 61.569, "r_y0": 252.89200000000005, "r_x1": 65.056, "r_y1": 252.89200000000005, "r_x2": 65.056, "r_y2": 244.34000000000003, "r_x3": 61.569, "r_y3": 244.34000000000003, "coord_origin": "TOPLEFT"}, "text": "\u2022", "orig": "\u2022", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 64, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.037, "r_y0": 252.89200000000005, "r_x1": 286.365, "r_y1": 252.89200000000005, "r_x2": 286.365, "r_y2": 244.34000000000003, "r_x3": 70.037, "r_y3": 244.34000000000003, "coord_origin": "TOPLEFT"}, "text": "There are occasional inaccuracies in the predictions of", "orig": "There are occasional inaccuracies in the predictions of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 65, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.037, "r_y0": 264.847, "r_x1": 150.415, "r_y1": 264.847, "r_x2": 150.415, "r_y2": 256.29499999999996, "r_x3": 70.037, "r_y3": 256.29499999999996, "coord_origin": "TOPLEFT"}, "text": "the bounding boxes.", "orig": "the bounding boxes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "\u00b7 There are occasional inaccuracies in the predictions of the bounding boxes."}, {"label": "text", "id": 0, "page_no": 11, "cluster": {"id": 0, "label": "text", "bbox": {"l": 50.112, "t": 279.472, "r": 286.365, "b": 395.621, "coord_origin": "TOPLEFT"}, "confidence": 0.9767085909843445, "cells": [{"index": 66, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 288.024, "r_x1": 286.365, "r_y1": 288.024, "r_x2": 286.365, "r_y2": 279.472, "r_x3": 62.067, "r_y3": 279.472, "coord_origin": "TOPLEFT"}, "text": "However, it is possible to mitigate those limitations by", "orig": "However, it is possible to mitigate those limitations by", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 67, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 299.979, "r_x1": 286.365, "r_y1": 299.979, "r_x2": 286.365, "r_y2": 291.427, "r_x3": 50.112, "r_y3": 291.427, "coord_origin": "TOPLEFT"}, "text": "combining the TableFormer predictions with the informa-", "orig": "combining the TableFormer predictions with the informa-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 68, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 311.934, "r_x1": 286.365, "r_y1": 311.934, "r_x2": 286.365, "r_y2": 303.382, "r_x3": 50.112, "r_y3": 303.382, "coord_origin": "TOPLEFT"}, "text": "tion already present inside a programmatic PDF document.", "orig": "tion already present inside a programmatic PDF document.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 69, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 323.889, "r_x1": 123.387, "r_y1": 323.889, "r_x2": 123.387, "r_y2": 315.337, "r_x3": 50.112, "r_y3": 315.337, "coord_origin": "TOPLEFT"}, "text": "More specifically,", "orig": "More specifically,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 70, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 128.348, "r_y0": 323.889, "r_x1": 286.365, "r_y1": 323.889, "r_x2": 286.365, "r_y2": 315.337, "r_x3": 128.348, "r_y3": 315.337, "coord_origin": "TOPLEFT"}, "text": "PDF documents can be seen as a se-", "orig": "PDF documents can be seen as a se-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 71, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 335.845, "r_x1": 286.365, "r_y1": 335.845, "r_x2": 286.365, "r_y2": 327.293, "r_x3": 50.112, "r_y3": 327.293, "coord_origin": "TOPLEFT"}, "text": "quence of PDF cells where each cell is described by its con-", "orig": "quence of PDF cells where each cell is described by its con-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 72, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 347.8, "r_x1": 286.365, "r_y1": 347.8, "r_x2": 286.365, "r_y2": 339.248, "r_x3": 50.112, "r_y3": 339.248, "coord_origin": "TOPLEFT"}, "text": "tent and bounding box. If we are able to associate the PDF", "orig": "tent and bounding box. If we are able to associate the PDF", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 73, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 359.755, "r_x1": 286.365, "r_y1": 359.755, "r_x2": 286.365, "r_y2": 351.203, "r_x3": 50.112, "r_y3": 351.203, "coord_origin": "TOPLEFT"}, "text": "cells with the predicted table cells, we can directly link the", "orig": "cells with the predicted table cells, we can directly link the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 74, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 371.71, "r_x1": 286.365, "r_y1": 371.71, "r_x2": 286.365, "r_y2": 363.158, "r_x3": 50.112, "r_y3": 363.158, "coord_origin": "TOPLEFT"}, "text": "PDF cell content to the table cell structure and use the PDF", "orig": "PDF cell content to the table cell structure and use the PDF", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 75, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 383.665, "r_x1": 286.365, "r_y1": 383.665, "r_x2": 286.365, "r_y2": 375.113, "r_x3": 50.112, "r_y3": 375.113, "coord_origin": "TOPLEFT"}, "text": "bounding boxes to correct misalignments in the predicted", "orig": "bounding boxes to correct misalignments in the predicted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 76, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 395.621, "r_x1": 154.56, "r_y1": 395.621, "r_x2": 154.56, "r_y2": 387.069, "r_x3": 50.112, "r_y3": 387.069, "coord_origin": "TOPLEFT"}, "text": "table cell bounding boxes.", "orig": "table cell bounding boxes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "However, it is possible to mitigate those limitations by combining the TableFormer predictions with the information already present inside a programmatic PDF document. More specifically, PDF documents can be seen as a sequence of PDF cells where each cell is described by its content and bounding box. If we are able to associate the PDF cells with the predicted table cells, we can directly link the PDF cell content to the table cell structure and use the PDF bounding boxes to correct misalignments in the predicted table cell bounding boxes."}, {"label": "text", "id": 11, "page_no": 11, "cluster": {"id": 11, "label": "text", "bbox": {"l": 50.112, "t": 399.338, "r": 286.365, "b": 419.846, "coord_origin": "TOPLEFT"}, "confidence": 0.934766411781311, "cells": [{"index": 77, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 407.89, "r_x1": 286.365, "r_y1": 407.89, "r_x2": 286.365, "r_y2": 399.338, "r_x3": 62.067, "r_y3": 399.338, "coord_origin": "TOPLEFT"}, "text": "Here is a step-by-step description of the prediction post-", "orig": "Here is a step-by-step description of the prediction post-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 78, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 419.846, "r_x1": 95.492, "r_y1": 419.846, "r_x2": 95.492, "r_y2": 411.294, "r_x3": 50.112, "r_y3": 411.294, "coord_origin": "TOPLEFT"}, "text": "processing:", "orig": "processing:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Here is a step-by-step description of the prediction postprocessing:"}, {"label": "list_item", "id": 20, "page_no": 11, "cluster": {"id": 20, "label": "list_item", "bbox": {"l": 50.112, "t": 423.564, "r": 286.365, "b": 456.026, "coord_origin": "TOPLEFT"}, "confidence": 0.8280702233314514, "cells": [{"index": 79, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 432.116, "r_x1": 286.365, "r_y1": 432.116, "r_x2": 286.365, "r_y2": 423.564, "r_x3": 62.067, "r_y3": 423.564, "coord_origin": "TOPLEFT"}, "text": "1. Get the minimal grid dimensions - number of rows and", "orig": "1. Get the minimal grid dimensions - number of rows and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 80, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 444.071, "r_x1": 218.779, "r_y1": 444.071, "r_x2": 218.779, "r_y2": 435.519, "r_x3": 50.112, "r_y3": 435.519, "coord_origin": "TOPLEFT"}, "text": "columns for the predicted table structure.", "orig": "columns for the predicted table structure.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 81, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 224.796, "r_y0": 444.071, "r_x1": 286.365, "r_y1": 444.071, "r_x2": 286.365, "r_y2": 435.519, "r_x3": 224.796, "r_y3": 435.519, "coord_origin": "TOPLEFT"}, "text": "This represents", "orig": "This represents", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 82, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 456.026, "r_x1": 274.51, "r_y1": 456.026, "r_x2": 274.51, "r_y2": 447.474, "r_x3": 50.112, "r_y3": 447.474, "coord_origin": "TOPLEFT"}, "text": "the most granular grid for the underlying table structure.", "orig": "the most granular grid for the underlying table structure.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "1. Get the minimal grid dimensions - number of rows and columns for the predicted table structure. This represents the most granular grid for the underlying table structure."}, {"label": "list_item", "id": 2, "page_no": 11, "cluster": {"id": 2, "label": "list_item", "bbox": {"l": 50.112, "t": 459.744, "r": 286.365, "b": 504.161, "coord_origin": "TOPLEFT"}, "confidence": 0.9646760821342468, "cells": [{"index": 83, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 468.296, "r_x1": 69.539, "r_y1": 468.296, "r_x2": 69.539, "r_y2": 459.744, "r_x3": 62.067, "r_y3": 459.744, "coord_origin": "TOPLEFT"}, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 84, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 77.429, "r_y0": 468.296, "r_x1": 286.365, "r_y1": 468.296, "r_x2": 286.365, "r_y2": 459.744, "r_x3": 77.429, "r_y3": 459.744, "coord_origin": "TOPLEFT"}, "text": "Generate pair-wise matches between the bounding", "orig": "Generate pair-wise matches between the bounding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 85, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 480.251, "r_x1": 286.365, "r_y1": 480.251, "r_x2": 286.365, "r_y2": 471.699, "r_x3": 50.112, "r_y3": 471.699, "coord_origin": "TOPLEFT"}, "text": "boxes of the PDF cells and the predicted cells. The Intersec-", "orig": "boxes of the PDF cells and the predicted cells. The Intersec-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 86, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 492.206, "r_x1": 286.365, "r_y1": 492.206, "r_x2": 286.365, "r_y2": 483.654, "r_x3": 50.112, "r_y3": 483.654, "coord_origin": "TOPLEFT"}, "text": "tion Over Union (IOU) metric is used to evaluate the quality", "orig": "tion Over Union (IOU) metric is used to evaluate the quality", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 87, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 504.161, "r_x1": 110.705, "r_y1": 504.161, "r_x2": 110.705, "r_y2": 495.609, "r_x3": 50.112, "r_y3": 495.609, "coord_origin": "TOPLEFT"}, "text": "of the matches.", "orig": "of the matches.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "2. Generate pair-wise matches between the bounding boxes of the PDF cells and the predicted cells. The Intersection Over Union (IOU) metric is used to evaluate the quality of the matches."}, {"label": "list_item", "id": 10, "page_no": 11, "cluster": {"id": 10, "label": "list_item", "bbox": {"l": 50.112, "t": 507.879, "r": 286.365, "b": 528.387, "coord_origin": "TOPLEFT"}, "confidence": 0.9391399025917053, "cells": [{"index": 88, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 516.431, "r_x1": 69.539, "r_y1": 516.431, "r_x2": 69.539, "r_y2": 507.879, "r_x3": 62.067, "r_y3": 507.879, "coord_origin": "TOPLEFT"}, "text": "3.", "orig": "3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 89, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 75.248, "r_y0": 516.431, "r_x1": 286.365, "r_y1": 516.431, "r_x2": 286.365, "r_y2": 507.879, "r_x3": 75.248, "r_y3": 507.879, "coord_origin": "TOPLEFT"}, "text": "Use a carefully selected IOU threshold to designate", "orig": "Use a carefully selected IOU threshold to designate", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 90, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 528.387, "r_x1": 226.071, "r_y1": 528.387, "r_x2": 226.071, "r_y2": 519.835, "r_x3": 50.112, "r_y3": 519.835, "coord_origin": "TOPLEFT"}, "text": "the matches as 'good' ones and 'bad' ones.", "orig": "the matches as 'good' ones and 'bad' ones.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "3. Use a carefully selected IOU threshold to designate the matches as 'good' ones and 'bad' ones."}, {"label": "list_item", "id": 8, "page_no": 11, "cluster": {"id": 8, "label": "list_item", "bbox": {"l": 50.112, "t": 532.104, "r": 286.365, "b": 564.567, "coord_origin": "TOPLEFT"}, "confidence": 0.9491708874702454, "cells": [{"index": 91, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 540.656, "r_x1": 76.453, "r_y1": 540.656, "r_x2": 76.453, "r_y2": 532.104, "r_x3": 62.067, "r_y3": 532.104, "coord_origin": "TOPLEFT"}, "text": "3.a.", "orig": "3.a.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 92, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 80.587, "r_y0": 540.656, "r_x1": 286.365, "r_y1": 540.656, "r_x2": 286.365, "r_y2": 532.104, "r_x3": 80.587, "r_y3": 532.104, "coord_origin": "TOPLEFT"}, "text": "If all IOU scores in a column are below the thresh-", "orig": "If all IOU scores in a column are below the thresh-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 93, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 552.612, "r_x1": 286.365, "r_y1": 552.612, "r_x2": 286.365, "r_y2": 544.06, "r_x3": 50.112, "r_y3": 544.06, "coord_origin": "TOPLEFT"}, "text": "old, discard all predictions (structure and bounding boxes)", "orig": "old, discard all predictions (structure and bounding boxes)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 94, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 564.567, "r_x1": 114.032, "r_y1": 564.567, "r_x2": 114.032, "r_y2": 556.015, "r_x3": 50.112, "r_y3": 556.015, "coord_origin": "TOPLEFT"}, "text": "for that column.", "orig": "for that column.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "3.a. If all IOU scores in a column are below the threshold, discard all predictions (structure and bounding boxes) for that column."}, {"label": "list_item", "id": 5, "page_no": 11, "cluster": {"id": 5, "label": "list_item", "bbox": {"l": 50.112, "t": 568.285, "r": 286.365, "b": 600.7470000000001, "coord_origin": "TOPLEFT"}, "confidence": 0.9587163329124451, "cells": [{"index": 95, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 576.837, "r_x1": 69.539, "r_y1": 576.837, "r_x2": 69.539, "r_y2": 568.285, "r_x3": 62.067, "r_y3": 568.285, "coord_origin": "TOPLEFT"}, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 96, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 76.732, "r_y0": 576.837, "r_x1": 286.365, "r_y1": 576.837, "r_x2": 286.365, "r_y2": 568.285, "r_x3": 76.732, "r_y3": 568.285, "coord_origin": "TOPLEFT"}, "text": "Find the best-fitting content alignment for the pre-", "orig": "Find the best-fitting content alignment for the pre-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 97, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 588.792, "r_x1": 286.365, "r_y1": 588.792, "r_x2": 286.365, "r_y2": 580.24, "r_x3": 50.112, "r_y3": 580.24, "coord_origin": "TOPLEFT"}, "text": "dicted cells with good IOU per each column. The alignment", "orig": "dicted cells with good IOU per each column. The alignment", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 98, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 600.7470000000001, "r_x1": 278.704, "r_y1": 600.7470000000001, "r_x2": 278.704, "r_y2": 592.1949999999999, "r_x3": 50.112, "r_y3": 592.1949999999999, "coord_origin": "TOPLEFT"}, "text": "of the column can be identified by the following formula:", "orig": "of the column can be identified by the following formula:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "4. Find the best-fitting content alignment for the predicted cells with good IOU per each column. The alignment of the column can be identified by the following formula:"}, {"label": "formula", "id": 12, "page_no": 11, "cluster": {"id": 12, "label": "formula", "bbox": {"l": 110.705, "t": 624.104, "r": 286.362, "b": 654.998, "coord_origin": "TOPLEFT"}, "confidence": 0.9298412799835205, "cells": [{"index": 99, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 112.028, "r_y0": 632.81, "r_x1": 157.952, "r_y1": 632.81, "r_x2": 157.952, "r_y2": 624.104, "r_x3": 112.028, "r_y3": 624.104, "coord_origin": "TOPLEFT"}, "text": "alignment", "orig": "alignment", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 100, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.715, "r_y0": 632.81, "r_x1": 203.496, "r_y1": 632.81, "r_x2": 203.496, "r_y2": 624.104, "r_x3": 160.715, "r_y3": 624.104, "coord_origin": "TOPLEFT"}, "text": "= arg min", "orig": "= arg min", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 101, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 185.585, "r_y0": 640.154, "r_x1": 189.145, "r_y1": 640.154, "r_x2": 189.145, "r_y2": 634.06, "r_x3": 185.585, "r_y3": 634.06, "coord_origin": "TOPLEFT"}, "text": "c", "orig": "c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 102, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 203.499, "r_y0": 632.668, "r_x1": 208.48, "r_y1": 632.668, "r_x2": 208.48, "r_y2": 624.104, "r_x3": 203.499, "r_y3": 624.104, "coord_origin": "TOPLEFT"}, "text": "{", "orig": "{", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 103, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 208.481, "r_y0": 632.81, "r_x1": 216.729, "r_y1": 632.81, "r_x2": 216.729, "r_y2": 624.104, "r_x3": 208.481, "r_y3": 624.104, "coord_origin": "TOPLEFT"}, "text": "D", "orig": "D", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 104, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 216.729, "r_y0": 633.734, "r_x1": 220.289, "r_y1": 633.734, "r_x2": 220.289, "r_y2": 627.64, "r_x3": 216.729, "r_y3": 627.64, "coord_origin": "TOPLEFT"}, "text": "c", "orig": "c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 105, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 220.787, "r_y0": 632.668, "r_x1": 225.768, "r_y1": 632.668, "r_x2": 225.768, "r_y2": 624.104, "r_x3": 220.787, "r_y3": 624.104, "coord_origin": "TOPLEFT"}, "text": "}", "orig": "}", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 106, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 110.705, "r_y0": 654.075, "r_x1": 118.953, "r_y1": 654.075, "r_x2": 118.953, "r_y2": 645.369, "r_x3": 110.705, "r_y3": 645.369, "coord_origin": "TOPLEFT"}, "text": "D", "orig": "D", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 107, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 118.953, "r_y0": 654.998, "r_x1": 122.513, "r_y1": 654.998, "r_x2": 122.513, "r_y2": 648.904, "r_x3": 118.953, "r_y3": 648.904, "coord_origin": "TOPLEFT"}, "text": "c", "orig": "c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 108, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 125.779, "r_y0": 654.075, "r_x1": 133.528, "r_y1": 654.075, "r_x2": 133.528, "r_y2": 645.369, "r_x3": 125.779, "r_y3": 645.369, "coord_origin": "TOPLEFT"}, "text": "=", "orig": "=", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 109, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 136.295, "r_y0": 654.075, "r_x1": 166.678, "r_y1": 654.075, "r_x2": 166.678, "r_y2": 645.369, "r_x3": 136.295, "r_y3": 645.369, "coord_origin": "TOPLEFT"}, "text": "max x", "orig": "max x", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 110, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 156.003, "r_y0": 653.933, "r_x1": 160.984, "r_y1": 653.933, "r_x2": 160.984, "r_y2": 645.369, "r_x3": 156.003, "r_y3": 645.369, "coord_origin": "TOPLEFT"}, "text": "{", "orig": "{", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 111, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 166.678, "r_y0": 654.998, "r_x1": 170.238, "r_y1": 654.998, "r_x2": 170.238, "r_y2": 648.904, "r_x3": 166.678, "r_y3": 648.904, "coord_origin": "TOPLEFT"}, "text": "c", "orig": "c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 112, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 170.736, "r_y0": 653.933, "r_x1": 185.678, "r_y1": 653.933, "r_x2": 185.678, "r_y2": 645.369, "r_x3": 170.736, "r_y3": 645.369, "coord_origin": "TOPLEFT"}, "text": "} -", "orig": "} -", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 113, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 187.894, "r_y0": 654.075, "r_x1": 216.729, "r_y1": 654.075, "r_x2": 216.729, "r_y2": 645.369, "r_x3": 187.894, "r_y3": 645.369, "coord_origin": "TOPLEFT"}, "text": "min x", "orig": "min x", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 114, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 206.054, "r_y0": 653.933, "r_x1": 211.035, "r_y1": 653.933, "r_x2": 211.035, "r_y2": 645.369, "r_x3": 206.054, "r_y3": 645.369, "coord_origin": "TOPLEFT"}, "text": "{", "orig": "{", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 115, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 216.729, "r_y0": 654.998, "r_x1": 220.289, "r_y1": 654.998, "r_x2": 220.289, "r_y2": 648.904, "r_x3": 216.729, "r_y3": 648.904, "coord_origin": "TOPLEFT"}, "text": "c", "orig": "c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 116, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 220.787, "r_y0": 653.933, "r_x1": 225.768, "r_y1": 653.933, "r_x2": 225.768, "r_y2": 645.369, "r_x3": 220.787, "r_y3": 645.369, "coord_origin": "TOPLEFT"}, "text": "}", "orig": "}", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 117, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 274.746, "r_y0": 643.706, "r_x1": 286.362, "r_y1": 643.706, "r_x2": 286.362, "r_y2": 635.154, "r_x3": 274.746, "r_y3": 635.154, "coord_origin": "TOPLEFT"}, "text": "(4)", "orig": "(4)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "alignment = arg min c { D c } D c = max x { c } -min x { c } (4)"}, {"label": "text", "id": 7, "page_no": 11, "cluster": {"id": 7, "label": "text", "bbox": {"l": 50.112, "t": 668.016, "r": 286.362, "b": 688.841, "coord_origin": "TOPLEFT"}, "confidence": 0.9545555114746094, "cells": [{"index": 118, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 676.886, "r_x1": 74.451, "r_y1": 676.886, "r_x2": 74.451, "r_y2": 668.3340000000001, "r_x3": 50.112, "r_y3": 668.3340000000001, "coord_origin": "TOPLEFT"}, "text": "where", "orig": "where", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 119, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 78.336, "r_y0": 676.722, "r_x1": 82.648, "r_y1": 676.722, "r_x2": 82.648, "r_y2": 668.016, "r_x3": 78.336, "r_y3": 668.016, "coord_origin": "TOPLEFT"}, "text": "c", "orig": "c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 120, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 86.533, "r_y0": 676.886, "r_x1": 93.178, "r_y1": 676.886, "r_x2": 93.178, "r_y2": 668.3340000000001, "r_x3": 86.533, "r_y3": 668.3340000000001, "coord_origin": "TOPLEFT"}, "text": "is", "orig": "is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 121, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 97.063, "r_y0": 676.886, "r_x1": 123.634, "r_y1": 676.886, "r_x2": 123.634, "r_y2": 668.3340000000001, "r_x3": 97.063, "r_y3": 668.3340000000001, "coord_origin": "TOPLEFT"}, "text": "one of", "orig": "one of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 122, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 127.519, "r_y0": 676.58, "r_x1": 132.5, "r_y1": 676.58, "r_x2": 132.5, "r_y2": 668.016, "r_x3": 127.519, "r_y3": 668.016, "coord_origin": "TOPLEFT"}, "text": "{", "orig": "{", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 123, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 132.501, "r_y0": 676.886, "r_x1": 148.272, "r_y1": 676.886, "r_x2": 148.272, "r_y2": 668.3340000000001, "r_x3": 132.501, "r_y3": 668.3340000000001, "coord_origin": "TOPLEFT"}, "text": "left,", "orig": "left,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 124, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 152.506, "r_y0": 676.886, "r_x1": 187.644, "r_y1": 676.886, "r_x2": 187.644, "r_y2": 668.3340000000001, "r_x3": 152.506, "r_y3": 668.3340000000001, "coord_origin": "TOPLEFT"}, "text": "centroid,", "orig": "centroid,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 125, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 191.878, "r_y0": 676.886, "r_x1": 210.697, "r_y1": 676.886, "r_x2": 210.697, "r_y2": 668.3340000000001, "r_x3": 191.878, "r_y3": 668.3340000000001, "coord_origin": "TOPLEFT"}, "text": "right", "orig": "right", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 126, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 210.697, "r_y0": 676.58, "r_x1": 215.678, "r_y1": 676.58, "r_x2": 215.678, "r_y2": 668.016, "r_x3": 210.697, "r_y3": 668.016, "coord_origin": "TOPLEFT"}, "text": "}", "orig": "}", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 127, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 219.563, "r_y0": 676.886, "r_x1": 233.949, "r_y1": 676.886, "r_x2": 233.949, "r_y2": 668.3340000000001, "r_x3": 219.563, "r_y3": 668.3340000000001, "coord_origin": "TOPLEFT"}, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 128, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 237.835, "r_y0": 676.722, "r_x1": 243.529, "r_y1": 676.722, "r_x2": 243.529, "r_y2": 668.016, "r_x3": 237.835, "r_y3": 668.016, "coord_origin": "TOPLEFT"}, "text": "x", "orig": "x", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 129, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 243.529, "r_y0": 677.645, "r_x1": 247.089, "r_y1": 677.645, "r_x2": 247.089, "r_y2": 671.551, "r_x3": 243.529, "r_y3": 671.551, "coord_origin": "TOPLEFT"}, "text": "c", "orig": "c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 130, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 251.473, "r_y0": 676.886, "r_x1": 258.118, "r_y1": 676.886, "r_x2": 258.118, "r_y2": 668.3340000000001, "r_x3": 251.473, "r_y3": 668.3340000000001, "coord_origin": "TOPLEFT"}, "text": "is", "orig": "is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 131, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 262.003, "r_y0": 676.886, "r_x1": 286.362, "r_y1": 676.886, "r_x2": 286.362, "r_y2": 668.3340000000001, "r_x3": 262.003, "r_y3": 668.3340000000001, "coord_origin": "TOPLEFT"}, "text": "the x-", "orig": "the x-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 132, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 688.841, "r_x1": 205.887, "r_y1": 688.841, "r_x2": 205.887, "r_y2": 680.289, "r_x3": 50.112, "r_y3": 680.289, "coord_origin": "TOPLEFT"}, "text": "coordinate for the corresponding point.", "orig": "coordinate for the corresponding point.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "where c is one of { left, centroid, right } and x c is the xcoordinate for the corresponding point."}, {"label": "list_item", "id": 13, "page_no": 11, "cluster": {"id": 13, "label": "list_item", "bbox": {"l": 50.112, "t": 692.559, "r": 286.365, "b": 713.066, "coord_origin": "TOPLEFT"}, "confidence": 0.9260510206222534, "cells": [{"index": 133, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 701.111, "r_x1": 69.539, "r_y1": 701.111, "r_x2": 69.539, "r_y2": 692.559, "r_x3": 62.067, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "5.", "orig": "5.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 134, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 76.274, "r_y0": 701.111, "r_x1": 286.365, "r_y1": 701.111, "r_x2": 286.365, "r_y2": 692.559, "r_x3": 76.274, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "Use the alignment computed in step 4, to compute", "orig": "Use the alignment computed in step 4, to compute", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 135, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 713.066, "r_x1": 94.605, "r_y1": 713.066, "r_x2": 94.605, "r_y2": 704.514, "r_x3": 50.112, "r_y3": 704.514, "coord_origin": "TOPLEFT"}, "text": "the median", "orig": "the median", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 136, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 97.599, "r_y0": 712.902, "r_x1": 103.293, "r_y1": 712.902, "r_x2": 103.293, "r_y2": 704.196, "r_x3": 97.599, "r_y3": 704.196, "coord_origin": "TOPLEFT"}, "text": "x", "orig": "x", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 137, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 103.292, "r_y0": 713.066, "r_x1": 286.365, "r_y1": 713.066, "r_x2": 286.365, "r_y2": 704.514, "r_x3": 103.292, "r_y3": 704.514, "coord_origin": "TOPLEFT"}, "text": "-coordinate for all table columns and the me-", "orig": "-coordinate for all table columns and the me-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "5. Use the alignment computed in step 4, to compute the median x -coordinate for all table columns and the me-"}, {"label": "text", "id": 16, "page_no": 11, "cluster": {"id": 16, "label": "text", "bbox": {"l": 308.862, "t": 211.20000000000005, "r": 545.115, "b": 255.61800000000005, "coord_origin": "TOPLEFT"}, "confidence": 0.8942298889160156, "cells": [{"index": 138, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 219.75199999999995, "r_x1": 435.915, "r_y1": 219.75199999999995, "r_x2": 435.915, "r_y2": 211.20000000000005, "r_x3": 308.862, "r_y3": 211.20000000000005, "coord_origin": "TOPLEFT"}, "text": "dian cell size for all table cells.", "orig": "dian cell size for all table cells.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 139, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 440.697, "r_y0": 219.75199999999995, "r_x1": 545.115, "r_y1": 219.75199999999995, "r_x2": 545.115, "r_y2": 211.20000000000005, "r_x3": 440.697, "r_y3": 211.20000000000005, "coord_origin": "TOPLEFT"}, "text": "The usage of median dur-", "orig": "The usage of median dur-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 140, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 231.70799999999997, "r_x1": 545.115, "r_y1": 231.70799999999997, "r_x2": 545.115, "r_y2": 223.15599999999995, "r_x3": 308.862, "r_y3": 223.15599999999995, "coord_origin": "TOPLEFT"}, "text": "ing the computations, helps to eliminate outliers caused by", "orig": "ing the computations, helps to eliminate outliers caused by", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 141, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 243.663, "r_x1": 545.115, "r_y1": 243.663, "r_x2": 545.115, "r_y2": 235.111, "r_x3": 308.862, "r_y3": 235.111, "coord_origin": "TOPLEFT"}, "text": "occasional column spans which are usually wider than the", "orig": "occasional column spans which are usually wider than the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 142, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 255.61800000000005, "r_x1": 339.577, "r_y1": 255.61800000000005, "r_x2": 339.577, "r_y2": 247.06600000000003, "r_x3": 308.862, "r_y3": 247.06600000000003, "coord_origin": "TOPLEFT"}, "text": "normal.", "orig": "normal.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "dian cell size for all table cells. The usage of median during the computations, helps to eliminate outliers caused by occasional column spans which are usually wider than the normal."}, {"label": "list_item", "id": 9, "page_no": 11, "cluster": {"id": 9, "label": "list_item", "bbox": {"l": 308.862, "t": 259.371, "r": 545.115, "b": 279.87800000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.9423392415046692, "cells": [{"index": 143, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 267.923, "r_x1": 328.289, "r_y1": 267.923, "r_x2": 328.289, "r_y2": 259.371, "r_x3": 320.817, "r_y3": 259.371, "coord_origin": "TOPLEFT"}, "text": "6.", "orig": "6.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 144, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 334.884, "r_y0": 267.923, "r_x1": 545.115, "r_y1": 267.923, "r_x2": 545.115, "r_y2": 259.371, "r_x3": 334.884, "r_y3": 259.371, "coord_origin": "TOPLEFT"}, "text": "Snap all cells with bad IOU to their corresponding", "orig": "Snap all cells with bad IOU to their corresponding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 145, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 279.87800000000004, "r_x1": 338.192, "r_y1": 279.87800000000004, "r_x2": 338.192, "r_y2": 271.326, "r_x3": 308.862, "r_y3": 271.326, "coord_origin": "TOPLEFT"}, "text": "median", "orig": "median", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 146, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 340.682, "r_y0": 279.71400000000006, "r_x1": 346.376, "r_y1": 279.71400000000006, "r_x2": 346.376, "r_y2": 271.00800000000004, "r_x3": 340.682, "r_y3": 271.00800000000004, "coord_origin": "TOPLEFT"}, "text": "x", "orig": "x", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 147, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 346.376, "r_y0": 279.87800000000004, "r_x1": 453.723, "r_y1": 279.87800000000004, "r_x2": 453.723, "r_y2": 271.326, "r_x3": 346.376, "r_y3": 271.326, "coord_origin": "TOPLEFT"}, "text": "-coordinates and cell sizes.", "orig": "-coordinates and cell sizes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "6. Snap all cells with bad IOU to their corresponding median x -coordinates and cell sizes."}, {"label": "list_item", "id": 6, "page_no": 11, "cluster": {"id": 6, "label": "list_item", "bbox": {"l": 308.862, "t": 283.632, "r": 545.115, "b": 387.825, "coord_origin": "TOPLEFT"}, "confidence": 0.9562004804611206, "cells": [{"index": 148, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 292.184, "r_x1": 328.289, "r_y1": 292.184, "r_x2": 328.289, "r_y2": 283.632, "r_x3": 320.817, "r_y3": 283.632, "coord_origin": "TOPLEFT"}, "text": "7.", "orig": "7.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 149, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 332.144, "r_y0": 292.184, "r_x1": 545.115, "r_y1": 292.184, "r_x2": 545.115, "r_y2": 283.632, "r_x3": 332.144, "r_y3": 283.632, "coord_origin": "TOPLEFT"}, "text": "Generate a new set of pair-wise matches between the", "orig": "Generate a new set of pair-wise matches between the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 150, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 304.139, "r_x1": 476.562, "r_y1": 304.139, "r_x2": 476.562, "r_y2": 295.587, "r_x3": 308.862, "r_y3": 295.587, "coord_origin": "TOPLEFT"}, "text": "corrected bounding boxes and PDF cells.", "orig": "corrected bounding boxes and PDF cells.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 151, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 482.082, "r_y0": 304.139, "r_x1": 545.115, "r_y1": 304.139, "r_x2": 545.115, "r_y2": 295.587, "r_x3": 482.082, "r_y3": 295.587, "coord_origin": "TOPLEFT"}, "text": "This time use a", "orig": "This time use a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 152, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 316.094, "r_x1": 545.115, "r_y1": 316.094, "r_x2": 545.115, "r_y2": 307.542, "r_x3": 308.862, "r_y3": 307.542, "coord_origin": "TOPLEFT"}, "text": "modified version of the IOU metric, where the area of the", "orig": "modified version of the IOU metric, where the area of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 153, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 328.049, "r_x1": 545.115, "r_y1": 328.049, "r_x2": 545.115, "r_y2": 319.497, "r_x3": 308.862, "r_y3": 319.497, "coord_origin": "TOPLEFT"}, "text": "intersection between the predicted and PDF cells is divided", "orig": "intersection between the predicted and PDF cells is divided", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 154, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 340.005, "r_x1": 397.19, "r_y1": 340.005, "r_x2": 397.19, "r_y2": 331.453, "r_x3": 308.862, "r_y3": 331.453, "coord_origin": "TOPLEFT"}, "text": "by the PDF cell area.", "orig": "by the PDF cell area.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 155, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 403.656, "r_y0": 340.005, "r_x1": 545.115, "r_y1": 340.005, "r_x2": 545.115, "r_y2": 331.453, "r_x3": 403.656, "r_y3": 331.453, "coord_origin": "TOPLEFT"}, "text": "In case there are multiple matches", "orig": "In case there are multiple matches", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 156, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 351.96, "r_x1": 545.115, "r_y1": 351.96, "r_x2": 545.115, "r_y2": 343.408, "r_x3": 308.862, "r_y3": 343.408, "coord_origin": "TOPLEFT"}, "text": "for the same PDF cell, the prediction with the higher score", "orig": "for the same PDF cell, the prediction with the higher score", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 157, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 363.915, "r_x1": 357.26, "r_y1": 363.915, "r_x2": 357.26, "r_y2": 355.363, "r_x3": 308.862, "r_y3": 355.363, "coord_origin": "TOPLEFT"}, "text": "is preferred.", "orig": "is preferred.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 158, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 361.176, "r_y0": 363.915, "r_x1": 545.115, "r_y1": 363.915, "r_x2": 545.115, "r_y2": 355.363, "r_x3": 361.176, "r_y3": 355.363, "coord_origin": "TOPLEFT"}, "text": "This covers the cases where the PDF cells are", "orig": "This covers the cases where the PDF cells are", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 159, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 375.87, "r_x1": 545.115, "r_y1": 375.87, "r_x2": 545.115, "r_y2": 367.318, "r_x3": 308.862, "r_y3": 367.318, "coord_origin": "TOPLEFT"}, "text": "smaller than the area of predicted or corrected prediction", "orig": "smaller than the area of predicted or corrected prediction", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 160, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 387.825, "r_x1": 329.614, "r_y1": 387.825, "r_x2": 329.614, "r_y2": 379.273, "r_x3": 308.862, "r_y3": 379.273, "coord_origin": "TOPLEFT"}, "text": "cells.", "orig": "cells.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "7. Generate a new set of pair-wise matches between the corrected bounding boxes and PDF cells. This time use a modified version of the IOU metric, where the area of the intersection between the predicted and PDF cells is divided by the PDF cell area. In case there are multiple matches for the same PDF cell, the prediction with the higher score is preferred. This covers the cases where the PDF cells are smaller than the area of predicted or corrected prediction cells."}, {"label": "list_item", "id": 17, "page_no": 11, "cluster": {"id": 17, "label": "list_item", "bbox": {"l": 308.862, "t": 391.579, "r": 545.115, "b": 459.906, "coord_origin": "TOPLEFT"}, "confidence": 0.8719939589500427, "cells": [{"index": 161, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 400.131, "r_x1": 328.289, "r_y1": 400.131, "r_x2": 328.289, "r_y2": 391.579, "r_x3": 320.817, "r_y3": 391.579, "coord_origin": "TOPLEFT"}, "text": "8.", "orig": "8.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 162, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 333.569, "r_y0": 400.131, "r_x1": 545.115, "r_y1": 400.131, "r_x2": 545.115, "r_y2": 391.579, "r_x3": 333.569, "r_y3": 391.579, "coord_origin": "TOPLEFT"}, "text": "In some rare occasions, we have noticed that Table-", "orig": "In some rare occasions, we have noticed that Table-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 163, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 412.086, "r_x1": 545.115, "r_y1": 412.086, "r_x2": 545.115, "r_y2": 403.534, "r_x3": 308.862, "r_y3": 403.534, "coord_origin": "TOPLEFT"}, "text": "Former can confuse a single column as two. When the post-", "orig": "Former can confuse a single column as two. When the post-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 164, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 424.041, "r_x1": 545.115, "r_y1": 424.041, "r_x2": 545.115, "r_y2": 415.489, "r_x3": 308.862, "r_y3": 415.489, "coord_origin": "TOPLEFT"}, "text": "processing steps are applied, this results with two predicted", "orig": "processing steps are applied, this results with two predicted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 165, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 435.996, "r_x1": 488.109, "r_y1": 435.996, "r_x2": 488.109, "r_y2": 427.444, "r_x3": 308.862, "r_y3": 427.444, "coord_origin": "TOPLEFT"}, "text": "columns pointing to the same PDF column.", "orig": "columns pointing to the same PDF column.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 166, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 494.336, "r_y0": 435.996, "r_x1": 545.115, "r_y1": 435.996, "r_x2": 545.115, "r_y2": 427.444, "r_x3": 494.336, "r_y3": 427.444, "coord_origin": "TOPLEFT"}, "text": "In such case", "orig": "In such case", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 167, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 447.951, "r_x1": 545.115, "r_y1": 447.951, "r_x2": 545.115, "r_y2": 439.399, "r_x3": 308.862, "r_y3": 439.399, "coord_origin": "TOPLEFT"}, "text": "we must de-duplicate the columns according to highest to-", "orig": "we must de-duplicate the columns according to highest to-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 168, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 459.906, "r_x1": 426.182, "r_y1": 459.906, "r_x2": 426.182, "r_y2": 451.354, "r_x3": 308.862, "r_y3": 451.354, "coord_origin": "TOPLEFT"}, "text": "tal column intersection score.", "orig": "tal column intersection score.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "8. In some rare occasions, we have noticed that TableFormer can confuse a single column as two. When the postprocessing steps are applied, this results with two predicted columns pointing to the same PDF column. In such case we must de-duplicate the columns according to highest total column intersection score."}, {"label": "list_item", "id": 15, "page_no": 11, "cluster": {"id": 15, "label": "list_item", "bbox": {"l": 308.862, "t": 463.66, "r": 545.115, "b": 567.8530000000001, "coord_origin": "TOPLEFT"}, "confidence": 0.9126082062721252, "cells": [{"index": 169, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 472.212, "r_x1": 328.289, "r_y1": 472.212, "r_x2": 328.289, "r_y2": 463.66, "r_x3": 320.817, "r_y3": 463.66, "coord_origin": "TOPLEFT"}, "text": "9.", "orig": "9.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 170, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 333.629, "r_y0": 472.212, "r_x1": 478.505, "r_y1": 472.212, "r_x2": 478.505, "r_y2": 463.66, "r_x3": 333.629, "r_y3": 463.66, "coord_origin": "TOPLEFT"}, "text": "Pick up the remaining orphan cells.", "orig": "Pick up the remaining orphan cells.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 171, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 483.855, "r_y0": 472.212, "r_x1": 545.115, "r_y1": 472.212, "r_x2": 545.115, "r_y2": 463.66, "r_x3": 483.855, "r_y3": 463.66, "coord_origin": "TOPLEFT"}, "text": "There could be", "orig": "There could be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 172, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 484.167, "r_x1": 545.115, "r_y1": 484.167, "r_x2": 545.115, "r_y2": 475.615, "r_x3": 308.862, "r_y3": 475.615, "coord_origin": "TOPLEFT"}, "text": "cases, when after applying all the previous post-processing", "orig": "cases, when after applying all the previous post-processing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 173, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 496.122, "r_x1": 545.115, "r_y1": 496.122, "r_x2": 545.115, "r_y2": 487.57, "r_x3": 308.862, "r_y3": 487.57, "coord_origin": "TOPLEFT"}, "text": "steps, some PDF cells could still remain without any match", "orig": "steps, some PDF cells could still remain without any match", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 174, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 508.077, "r_x1": 381.898, "r_y1": 508.077, "r_x2": 381.898, "r_y2": 499.525, "r_x3": 308.862, "r_y3": 499.525, "coord_origin": "TOPLEFT"}, "text": "to predicted cells.", "orig": "to predicted cells.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 175, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 388.702, "r_y0": 508.077, "r_x1": 545.115, "r_y1": 508.077, "r_x2": 545.115, "r_y2": 499.525, "r_x3": 388.702, "r_y3": 499.525, "coord_origin": "TOPLEFT"}, "text": "However, it is still possible to deduce", "orig": "However, it is still possible to deduce", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 176, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 520.033, "r_x1": 545.115, "r_y1": 520.033, "r_x2": 545.115, "r_y2": 511.481, "r_x3": 308.862, "r_y3": 511.481, "coord_origin": "TOPLEFT"}, "text": "the correct matching for an orphan PDF cell by mapping its", "orig": "the correct matching for an orphan PDF cell by mapping its", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 177, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 531.988, "r_x1": 483.576, "r_y1": 531.988, "r_x2": 483.576, "r_y2": 523.4359999999999, "r_x3": 308.862, "r_y3": 523.4359999999999, "coord_origin": "TOPLEFT"}, "text": "bounding box on the geometry of the grid.", "orig": "bounding box on the geometry of the grid.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 178, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 489.195, "r_y0": 531.988, "r_x1": 545.115, "r_y1": 531.988, "r_x2": 545.115, "r_y2": 523.4359999999999, "r_x3": 489.195, "r_y3": 523.4359999999999, "coord_origin": "TOPLEFT"}, "text": "This mapping", "orig": "This mapping", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 179, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 543.943, "r_x1": 545.115, "r_y1": 543.943, "r_x2": 545.115, "r_y2": 535.3910000000001, "r_x3": 308.862, "r_y3": 535.3910000000001, "coord_origin": "TOPLEFT"}, "text": "decides if the content of the orphan cell will be appended to", "orig": "decides if the content of the orphan cell will be appended to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 180, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 555.898, "r_x1": 545.115, "r_y1": 555.898, "r_x2": 545.115, "r_y2": 547.346, "r_x3": 308.862, "r_y3": 547.346, "coord_origin": "TOPLEFT"}, "text": "an already matched table cell, or a new table cell should be", "orig": "an already matched table cell, or a new table cell should be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 181, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 567.8530000000001, "r_x1": 442.221, "r_y1": 567.8530000000001, "r_x2": 442.221, "r_y2": 559.3009999999999, "r_x3": 308.862, "r_y3": 559.3009999999999, "coord_origin": "TOPLEFT"}, "text": "created to match with the orphan.", "orig": "created to match with the orphan.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "9. Pick up the remaining orphan cells. There could be cases, when after applying all the previous post-processing steps, some PDF cells could still remain without any match to predicted cells. However, it is still possible to deduce the correct matching for an orphan PDF cell by mapping its bounding box on the geometry of the grid. This mapping decides if the content of the orphan cell will be appended to an already matched table cell, or a new table cell should be created to match with the orphan."}, {"label": "text", "id": 19, "page_no": 11, "cluster": {"id": 19, "label": "text", "bbox": {"l": 308.862, "t": 571.607, "r": 545.117, "b": 604.069, "coord_origin": "TOPLEFT"}, "confidence": 0.8459473848342896, "cells": [{"index": 182, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 580.159, "r_x1": 332.712, "r_y1": 580.159, "r_x2": 332.712, "r_y2": 571.607, "r_x3": 320.817, "r_y3": 571.607, "coord_origin": "TOPLEFT"}, "text": "9a.", "orig": "9a.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 183, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 337.943, "r_y0": 580.159, "r_x1": 545.115, "r_y1": 580.159, "r_x2": 545.115, "r_y2": 571.607, "r_x3": 337.943, "r_y3": 571.607, "coord_origin": "TOPLEFT"}, "text": "Compute the top and bottom boundary of the hori-", "orig": "Compute the top and bottom boundary of the hori-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 184, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 592.114, "r_x1": 471.641, "r_y1": 592.114, "r_x2": 471.641, "r_y2": 583.562, "r_x3": 308.862, "r_y3": 583.562, "coord_origin": "TOPLEFT"}, "text": "zontal band for each grid row (min/max", "orig": "zontal band for each grid row (min/max", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 185, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 474.834, "r_y0": 591.95, "r_x1": 479.719, "r_y1": 591.95, "r_x2": 479.719, "r_y2": 583.244, "r_x3": 474.834, "r_y3": 583.244, "coord_origin": "TOPLEFT"}, "text": "y", "orig": "y", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 186, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 483.269, "r_y0": 592.114, "r_x1": 545.117, "r_y1": 592.114, "r_x2": 545.117, "r_y2": 583.562, "r_x3": 483.269, "r_y3": 583.562, "coord_origin": "TOPLEFT"}, "text": "coordinates per", "orig": "coordinates per", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 187, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 604.069, "r_x1": 329.913, "r_y1": 604.069, "r_x2": 329.913, "r_y2": 595.517, "r_x3": 308.862, "r_y3": 595.517, "coord_origin": "TOPLEFT"}, "text": "row).", "orig": "row).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "9a. Compute the top and bottom boundary of the horizontal band for each grid row (min/max y coordinates per row)."}, {"label": "list_item", "id": 21, "page_no": 11, "cluster": {"id": 21, "label": "list_item", "bbox": {"l": 308.862, "t": 607.822, "r": 545.115, "b": 628.33, "coord_origin": "TOPLEFT"}, "confidence": 0.7716891169548035, "cells": [{"index": 188, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 616.374, "r_x1": 332.872, "r_y1": 616.374, "r_x2": 332.872, "r_y2": 607.822, "r_x3": 320.817, "r_y3": 607.822, "coord_origin": "TOPLEFT"}, "text": "9b.", "orig": "9b.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 189, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 339.925, "r_y0": 616.374, "r_x1": 374.226, "r_y1": 616.374, "r_x2": 374.226, "r_y2": 607.822, "r_x3": 339.925, "r_y3": 607.822, "coord_origin": "TOPLEFT"}, "text": "Intersect", "orig": "Intersect", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 190, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 378.042, "r_y0": 616.374, "r_x1": 545.115, "r_y1": 616.374, "r_x2": 545.115, "r_y2": 607.822, "r_x3": 378.042, "r_y3": 607.822, "coord_origin": "TOPLEFT"}, "text": "the orphan's bounding box with the row", "orig": "the orphan's bounding box with the row", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 191, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 628.33, "r_x1": 495.292, "r_y1": 628.33, "r_x2": 495.292, "r_y2": 619.778, "r_x3": 308.862, "r_y3": 619.778, "coord_origin": "TOPLEFT"}, "text": "bands, and map the cell to the closest grid row.", "orig": "bands, and map the cell to the closest grid row.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "9b. Intersect the orphan's bounding box with the row bands, and map the cell to the closest grid row."}, {"label": "list_item", "id": 18, "page_no": 11, "cluster": {"id": 18, "label": "list_item", "bbox": {"l": 308.862, "t": 632.083, "r": 545.115, "b": 664.545, "coord_origin": "TOPLEFT"}, "confidence": 0.8584907054901123, "cells": [{"index": 192, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 640.635, "r_x1": 332.712, "r_y1": 640.635, "r_x2": 332.712, "r_y2": 632.083, "r_x3": 320.817, "r_y3": 632.083, "coord_origin": "TOPLEFT"}, "text": "9c.", "orig": "9c.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 193, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 337.534, "r_y0": 640.635, "r_x1": 545.115, "r_y1": 640.635, "r_x2": 545.115, "r_y2": 632.083, "r_x3": 337.534, "r_y3": 632.083, "coord_origin": "TOPLEFT"}, "text": "Compute the left and right boundary of the vertical", "orig": "Compute the left and right boundary of the vertical", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 194, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 652.59, "r_x1": 455.282, "r_y1": 652.59, "r_x2": 455.282, "r_y2": 644.038, "r_x3": 308.862, "r_y3": 644.038, "coord_origin": "TOPLEFT"}, "text": "band for each grid column (min/max", "orig": "band for each grid column (min/max", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 195, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 457.777, "r_y0": 652.4259999999999, "r_x1": 463.471, "r_y1": 652.4259999999999, "r_x2": 463.471, "r_y2": 643.72, "r_x3": 457.777, "r_y3": 643.72, "coord_origin": "TOPLEFT"}, "text": "x", "orig": "x", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 196, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 465.971, "r_y0": 652.59, "r_x1": 545.114, "r_y1": 652.59, "r_x2": 545.114, "r_y2": 644.038, "r_x3": 465.971, "r_y3": 644.038, "coord_origin": "TOPLEFT"}, "text": "coordinates per col-", "orig": "coordinates per col-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 197, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 664.545, "r_x1": 332.384, "r_y1": 664.545, "r_x2": 332.384, "r_y2": 655.9929999999999, "r_x3": 308.862, "r_y3": 655.9929999999999, "coord_origin": "TOPLEFT"}, "text": "umn).", "orig": "umn).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "9c. Compute the left and right boundary of the vertical band for each grid column (min/max x coordinates per column)."}, {"label": "list_item", "id": 22, "page_no": 11, "cluster": {"id": 22, "label": "list_item", "bbox": {"l": 308.862, "t": 668.299, "r": 545.115, "b": 688.806, "coord_origin": "TOPLEFT"}, "confidence": 0.7590745091438293, "cells": [{"index": 198, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 676.851, "r_x1": 545.115, "r_y1": 676.851, "r_x2": 545.115, "r_y2": 668.299, "r_x3": 320.817, "r_y3": 668.299, "coord_origin": "TOPLEFT"}, "text": "9d. Intersect the orphan's bounding box with the column", "orig": "9d. Intersect the orphan's bounding box with the column", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 199, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 688.806, "r_x1": 510.585, "r_y1": 688.806, "r_x2": 510.585, "r_y2": 680.254, "r_x3": 308.862, "r_y3": 680.254, "coord_origin": "TOPLEFT"}, "text": "bands, and map the cell to the closest grid column.", "orig": "bands, and map the cell to the closest grid column.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "9d. Intersect the orphan's bounding box with the column bands, and map the cell to the closest grid column."}, {"label": "list_item", "id": 25, "page_no": 11, "cluster": {"id": 25, "label": "list_item", "bbox": {"l": 308.862, "t": 692.559, "r": 545.115, "b": 713.066, "coord_origin": "TOPLEFT"}, "confidence": 0.6971189975738525, "cells": [{"index": 200, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 701.111, "r_x1": 545.115, "r_y1": 701.111, "r_x2": 545.115, "r_y2": 692.559, "r_x3": 320.817, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "9e. If the table cell under the identified row and column", "orig": "9e. If the table cell under the identified row and column", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 201, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 713.066, "r_x1": 545.115, "r_y1": 713.066, "r_x2": 545.115, "r_y2": 704.514, "r_x3": 308.862, "r_y3": 704.514, "coord_origin": "TOPLEFT"}, "text": "is not empty, extend its content with the content of the or-", "orig": "is not empty, extend its content with the content of the or-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "9e. If the table cell under the identified row and column is not empty, extend its content with the content of the or-"}, {"label": "page_footer", "id": 14, "page_no": 11, "cluster": {"id": 14, "label": "page_footer", "bbox": {"l": 292.631, "t": 734.402, "r": 302.594, "b": 742.954, "coord_origin": "TOPLEFT"}, "confidence": 0.9126598238945007, "cells": [{"index": 202, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 292.631, "r_y0": 742.954, "r_x1": 302.594, "r_y1": 742.954, "r_x2": 302.594, "r_y2": 734.402, "r_x3": 292.631, "r_y3": 734.402, "coord_origin": "TOPLEFT"}, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "12"}], "body": [{"label": "picture", "id": 30, "page_no": 11, "cluster": {"id": 30, "label": "picture", "bbox": {"l": 53.54227066040039, "t": 74.74854278564453, "r": 544.938232421875, "b": 147.59091186523438, "coord_origin": "TOPLEFT"}, "confidence": 0.6033818125724792, "cells": [{"index": 0, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 119.391, "r_y0": 83.19600000000003, "r_x1": 151.946, "r_y1": 83.19600000000003, "r_x2": 151.946, "r_y2": 77.543, "r_x3": 119.391, "r_y3": 77.543, "coord_origin": "TOPLEFT"}, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 53.346, "r_y0": 81.077, "r_x1": 59.327, "r_y1": 81.077, "r_x2": 59.327, "r_y2": 75.42399999999998, "r_x3": 53.346, "r_y3": 75.42399999999998, "coord_origin": "TOPLEFT"}, "text": "b.", "orig": "b.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 289.579, "r_y0": 83.34400000000005, "r_x1": 319.827, "r_y1": 83.34400000000005, "r_x2": 319.827, "r_y2": 77.69100000000003, "r_x3": 289.579, "r_y3": 77.69100000000003, "coord_origin": "TOPLEFT"}, "text": "FinTabNet", "orig": "FinTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 448.373, "r_y0": 83.13999999999999, "r_x1": 481.759, "r_y1": 83.13999999999999, "r_x2": 481.759, "r_y2": 77.48699999999997, "r_x3": 448.373, "r_y3": 77.48699999999997, "coord_origin": "TOPLEFT"}, "text": "Table Bank", "orig": "Table Bank", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 82.553, "r_y0": 146.18100000000004, "r_x1": 105.08, "r_y1": 146.18100000000004, "r_x2": 105.08, "r_y2": 141.47000000000003, "r_x3": 82.553, "r_y3": 141.47000000000003, "coord_origin": "TOPLEFT"}, "text": "Train Val", "orig": "Train Val", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 63.039, "r_y0": 106.00900000000001, "r_x1": 85.29, "r_y1": 106.00900000000001, "r_x2": 85.29, "r_y2": 101.298, "r_x3": 63.039, "r_y3": 101.298, "coord_origin": "TOPLEFT"}, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 67.768, "r_y0": 129.29999999999995, "r_x1": 85.231, "r_y1": 129.29999999999995, "r_x2": 85.231, "r_y2": 124.58900000000006, "r_x3": 67.768, "r_y3": 124.58900000000006, "coord_origin": "TOPLEFT"}, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 227.551, "r_y0": 107.44500000000005, "r_x1": 249.803, "r_y1": 107.44500000000005, "r_x2": 249.803, "r_y2": 102.73400000000004, "r_x3": 227.551, "r_y3": 102.73400000000004, "coord_origin": "TOPLEFT"}, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 232.199, "r_y0": 131.89099999999996, "r_x1": 249.662, "r_y1": 131.89099999999996, "r_x2": 249.662, "r_y2": 127.17999999999995, "r_x3": 232.199, "r_y3": 127.17999999999995, "coord_origin": "TOPLEFT"}, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 396.234, "r_y0": 118.95000000000005, "r_x1": 413.697, "r_y1": 118.95000000000005, "r_x2": 413.697, "r_y2": 114.23900000000003, "r_x3": 396.234, "r_y3": 114.23900000000003, "coord_origin": "TOPLEFT"}, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 60.938, "r_y0": 90.63800000000003, "r_x1": 76.151, "r_y1": 90.63800000000003, "r_x2": 76.151, "r_y2": 85.92700000000002, "r_x3": 60.938, "r_y3": 85.92700000000002, "coord_origin": "TOPLEFT"}, "text": "100%", "orig": "100%", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 82.305, "r_y0": 91.12800000000004, "r_x1": 106.992, "r_y1": 91.10699999999997, "r_x2": 106.992, "r_y2": 86.39599999999996, "r_x3": 82.305, "r_y3": 86.41700000000003, "coord_origin": "TOPLEFT"}, "text": "500K 10K", "orig": "500K 10K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 246.205, "r_y0": 146.51099999999997, "r_x1": 271.386, "r_y1": 146.51099999999997, "r_x2": 271.386, "r_y2": 141.79999999999995, "r_x3": 246.205, "r_y3": 141.79999999999995, "coord_origin": "TOPLEFT"}, "text": "Train Test", "orig": "Train Test", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 274.182, "r_y0": 146.51099999999997, "r_x1": 281.88, "r_y1": 146.51099999999997, "r_x2": 281.88, "r_y2": 141.79999999999995, "r_x3": 274.182, "r_y3": 141.79999999999995, "coord_origin": "TOPLEFT"}, "text": "Val", "orig": "Val", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 226.698, "r_y0": 90.63800000000003, "r_x1": 241.912, "r_y1": 90.63800000000003, "r_x2": 241.912, "r_y2": 85.92700000000002, "r_x3": 226.698, "r_y3": 85.92700000000002, "coord_origin": "TOPLEFT"}, "text": "100%", "orig": "100%", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 249.939, "r_y0": 90.99300000000005, "r_x1": 282.494, "r_y1": 91.0, "r_x2": 282.494, "r_y2": 86.28899999999999, "r_x3": 249.939, "r_y3": 86.28200000000004, "coord_origin": "TOPLEFT"}, "text": "91K 10K10K", "orig": "91K 10K10K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 410.194, "r_y0": 146.18100000000004, "r_x1": 434.278, "r_y1": 146.32799999999997, "r_x2": 434.278, "r_y2": 141.61699999999996, "r_x3": 410.194, "r_y3": 141.47000000000003, "coord_origin": "TOPLEFT"}, "text": "Train Test", "orig": "Train Test", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 436.991, "r_y0": 146.32799999999997, "r_x1": 444.689, "r_y1": 146.32799999999997, "r_x2": 444.689, "r_y2": 141.61699999999996, "r_x3": 436.991, "r_y3": 141.61699999999996, "coord_origin": "TOPLEFT"}, "text": "Val", "orig": "Val", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 391.373, "r_y0": 90.63800000000003, "r_x1": 406.587, "r_y1": 90.63800000000003, "r_x2": 406.587, "r_y2": 85.92700000000002, "r_x3": 391.373, "r_y3": 85.92700000000002, "coord_origin": "TOPLEFT"}, "text": "100%", "orig": "100%", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 19, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 410.521, "r_y0": 91.12800000000004, "r_x1": 445.624, "r_y1": 91.16600000000005, "r_x2": 445.624, "r_y2": 86.45500000000004, "r_x3": 410.521, "r_y3": 86.41700000000003, "coord_origin": "TOPLEFT"}, "text": "130K 5K 10K", "orig": "130K 5K 10K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 20, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 113.949, "r_y0": 146.19299999999998, "r_x1": 156.042, "r_y1": 146.341, "r_x2": 156.042, "r_y2": 141.63, "r_x3": 113.949, "r_y3": 141.48199999999997, "coord_origin": "TOPLEFT"}, "text": "Complex Simple", "orig": "Complex Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 21, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 116.916, "r_y0": 99.72299999999996, "r_x1": 127.054, "r_y1": 99.72299999999996, "r_x2": 127.054, "r_y2": 95.01199999999994, "r_x3": 116.916, "r_y3": 95.01199999999994, "coord_origin": "TOPLEFT"}, "text": "Non", "orig": "Non", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 22, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 113.315, "r_y0": 105.84299999999996, "r_x1": 127.053, "r_y1": 105.84299999999996, "r_x2": 127.053, "r_y2": 101.13199999999995, "r_x3": 113.315, "r_y3": 101.13199999999995, "coord_origin": "TOPLEFT"}, "text": "Strict", "orig": "Strict", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 23, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 112.941, "r_y0": 111.96299999999997, "r_x1": 127.055, "r_y1": 111.96299999999997, "r_x2": 127.055, "r_y2": 107.25199999999995, "r_x3": 112.941, "r_y3": 107.25199999999995, "coord_origin": "TOPLEFT"}, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 24, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 113.227, "r_y0": 127.51999999999998, "r_x1": 126.966, "r_y1": 127.51999999999998, "r_x2": 126.966, "r_y2": 122.80899999999997, "r_x3": 113.227, "r_y3": 122.80899999999997, "coord_origin": "TOPLEFT"}, "text": "Strict", "orig": "Strict", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 25, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 112.854, "r_y0": 133.64, "r_x1": 126.968, "r_y1": 133.64, "r_x2": 126.968, "r_y2": 128.92899999999997, "r_x3": 112.854, "r_y3": 128.92899999999997, "coord_origin": "TOPLEFT"}, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 26, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 122.031, "r_y0": 91.17600000000004, "r_x1": 151.042, "r_y1": 91.17100000000005, "r_x2": 151.042, "r_y2": 86.46000000000004, "r_x3": 122.031, "r_y3": 86.46500000000003, "coord_origin": "TOPLEFT"}, "text": "230K 280K", "orig": "230K 280K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 27, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 311.654, "r_y0": 91.46000000000004, "r_x1": 321.672, "r_y1": 91.46000000000004, "r_x2": 321.672, "r_y2": 86.74900000000002, "r_x3": 311.654, "r_y3": 86.74900000000002, "coord_origin": "TOPLEFT"}, "text": "65K", "orig": "65K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 28, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 287.894, "r_y0": 146.615, "r_x1": 328.809, "r_y1": 146.615, "r_x2": 328.809, "r_y2": 141.904, "r_x3": 287.894, "r_y3": 141.904, "coord_origin": "TOPLEFT"}, "text": "Complex Simple", "orig": "Complex Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 29, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 289.236, "r_y0": 97.98500000000001, "r_x1": 299.375, "r_y1": 97.98500000000001, "r_x2": 299.375, "r_y2": 93.274, "r_x3": 289.236, "r_y3": 93.274, "coord_origin": "TOPLEFT"}, "text": "Non", "orig": "Non", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 30, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 285.635, "r_y0": 104.10500000000002, "r_x1": 299.373, "r_y1": 104.10500000000002, "r_x2": 299.373, "r_y2": 99.394, "r_x3": 285.635, "r_y3": 99.394, "coord_origin": "TOPLEFT"}, "text": "Strict", "orig": "Strict", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 285.261, "r_y0": 110.22500000000002, "r_x1": 299.375, "r_y1": 110.22500000000002, "r_x2": 299.375, "r_y2": 105.51400000000001, "r_x3": 285.261, "r_y3": 105.51400000000001, "coord_origin": "TOPLEFT"}, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 285.431, "r_y0": 125.29499999999996, "r_x1": 299.169, "r_y1": 125.29499999999996, "r_x2": 299.169, "r_y2": 120.58399999999995, "r_x3": 285.431, "r_y3": 120.58399999999995, "coord_origin": "TOPLEFT"}, "text": "Strict", "orig": "Strict", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 285.057, "r_y0": 131.41499999999996, "r_x1": 299.171, "r_y1": 131.41499999999996, "r_x2": 299.171, "r_y2": 126.70399999999995, "r_x3": 285.057, "r_y3": 126.70399999999995, "coord_origin": "TOPLEFT"}, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 299.584, "r_y0": 91.59799999999996, "r_x1": 309.602, "r_y1": 91.59799999999996, "r_x2": 309.602, "r_y2": 86.88699999999994, "r_x3": 299.584, "r_y3": 86.88699999999994, "coord_origin": "TOPLEFT"}, "text": "47K", "orig": "47K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 466.041, "r_y0": 146.57600000000002, "r_x1": 483.504, "r_y1": 146.57600000000002, "r_x2": 483.504, "r_y2": 141.86599999999999, "r_x3": 466.041, "r_y3": 141.86599999999999, "coord_origin": "TOPLEFT"}, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 459.022, "r_y0": 98.66600000000005, "r_x1": 469.16, "r_y1": 98.66600000000005, "r_x2": 469.16, "r_y2": 93.95500000000004, "r_x3": 459.022, "r_y3": 93.95500000000004, "coord_origin": "TOPLEFT"}, "text": "Non", "orig": "Non", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 455.421, "r_y0": 104.78599999999994, "r_x1": 469.159, "r_y1": 104.78599999999994, "r_x2": 469.159, "r_y2": 100.07500000000005, "r_x3": 455.421, "r_y3": 100.07500000000005, "coord_origin": "TOPLEFT"}, "text": "Strict", "orig": "Strict", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 455.047, "r_y0": 110.90599999999995, "r_x1": 469.161, "r_y1": 110.90599999999995, "r_x2": 469.161, "r_y2": 106.19500000000005, "r_x3": 455.047, "r_y3": 106.19500000000005, "coord_origin": "TOPLEFT"}, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 467.394, "r_y0": 90.47699999999998, "r_x1": 480.655, "r_y1": 90.47699999999998, "r_x2": 480.655, "r_y2": 85.76599999999996, "r_x3": 467.394, "r_y3": 85.76599999999996, "coord_origin": "TOPLEFT"}, "text": "145K", "orig": "145K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.377, "r_y0": 146.48900000000003, "r_x1": 202.841, "r_y1": 146.61599999999999, "r_x2": 202.841, "r_y2": 141.90499999999997, "r_x3": 160.377, "r_y3": 141.77800000000002, "coord_origin": "TOPLEFT"}, "text": "Complex Simple", "orig": "Complex Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 153.743, "r_y0": 99.76999999999998, "r_x1": 173.327, "r_y1": 99.76999999999998, "r_x2": 173.327, "r_y2": 95.05899999999997, "r_x3": 153.743, "r_y3": 95.05899999999997, "coord_origin": "TOPLEFT"}, "text": "Contain", "orig": "Contain", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 154.51, "r_y0": 105.88999999999999, "r_x1": 173.325, "r_y1": 105.88999999999999, "r_x2": 173.325, "r_y2": 101.17899999999997, "r_x3": 154.51, "r_y3": 101.17899999999997, "coord_origin": "TOPLEFT"}, "text": "Missing", "orig": "Missing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 155.272, "r_y0": 112.00999999999999, "r_x1": 173.327, "r_y1": 112.00999999999999, "r_x2": 173.327, "r_y2": 107.29899999999998, "r_x3": 155.272, "r_y3": 107.29899999999998, "coord_origin": "TOPLEFT"}, "text": "bboxes", "orig": "bboxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 326.413, "r_y0": 112.13699999999994, "r_x1": 345.997, "r_y1": 112.13699999999994, "r_x2": 345.997, "r_y2": 107.42600000000004, "r_x3": 326.413, "r_y3": 107.42600000000004, "coord_origin": "TOPLEFT"}, "text": "Contain", "orig": "Contain", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 327.18, "r_y0": 118.25699999999995, "r_x1": 345.995, "r_y1": 118.25699999999995, "r_x2": 345.995, "r_y2": 113.54600000000005, "r_x3": 327.18, "r_y3": 113.54600000000005, "coord_origin": "TOPLEFT"}, "text": "Missing", "orig": "Missing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 327.941, "r_y0": 124.37699999999995, "r_x1": 345.996, "r_y1": 124.37699999999995, "r_x2": 345.996, "r_y2": 119.66600000000005, "r_x3": 327.941, "r_y3": 119.66600000000005, "coord_origin": "TOPLEFT"}, "text": "bboxes", "orig": "bboxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 488.994, "r_y0": 109.05899999999997, "r_x1": 508.764, "r_y1": 109.05899999999997, "r_x2": 508.764, "r_y2": 104.34799999999996, "r_x3": 488.994, "r_y3": 104.34799999999996, "coord_origin": "TOPLEFT"}, "text": "Dataset", "orig": "Dataset", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 48, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 490.189, "r_y0": 115.17899999999997, "r_x1": 508.764, "r_y1": 115.17899999999997, "r_x2": 508.764, "r_y2": 110.46799999999996, "r_x3": 490.189, "r_y3": 110.46799999999996, "coord_origin": "TOPLEFT"}, "text": "doesn't", "orig": "doesn't", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 49, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 489.72, "r_y0": 121.29899999999998, "r_x1": 508.768, "r_y1": 121.29899999999998, "r_x2": 508.768, "r_y2": 116.58799999999997, "r_x3": 489.72, "r_y3": 116.58799999999997, "coord_origin": "TOPLEFT"}, "text": "provide", "orig": "provide", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 50, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 490.711, "r_y0": 127.41899999999998, "r_x1": 508.766, "r_y1": 127.41899999999998, "r_x2": 508.766, "r_y2": 122.70799999999997, "r_x3": 490.711, "r_y3": 122.70799999999997, "coord_origin": "TOPLEFT"}, "text": "bboxes", "orig": "bboxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 51, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 168.504, "r_y0": 91.04100000000005, "r_x1": 197.527, "r_y1": 91.0, "r_x2": 197.527, "r_y2": 86.28899999999999, "r_x3": 168.504, "r_y3": 86.33000000000004, "coord_origin": "TOPLEFT"}, "text": "230K 280K", "orig": "230K 280K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 52, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 357.377, "r_y0": 90.90200000000004, "r_x1": 367.395, "r_y1": 90.90200000000004, "r_x2": 367.395, "r_y2": 86.19100000000003, "r_x3": 357.377, "r_y3": 86.19100000000003, "coord_origin": "TOPLEFT"}, "text": "65K", "orig": "65K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 53, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 333.732, "r_y0": 146.52800000000002, "r_x1": 374.929, "r_y1": 146.52800000000002, "r_x2": 374.929, "r_y2": 141.817, "r_x3": 333.732, "r_y3": 141.817, "coord_origin": "TOPLEFT"}, "text": "Complex Simple", "orig": "Complex Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 54, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 345.691, "r_y0": 90.96100000000001, "r_x1": 355.709, "r_y1": 90.96100000000001, "r_x2": 355.709, "r_y2": 86.25, "r_x3": 345.691, "r_y3": 86.25, "coord_origin": "TOPLEFT"}, "text": "47K", "orig": "47K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 55, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 508.543, "r_y0": 146.28200000000004, "r_x1": 526.006, "r_y1": 146.28200000000004, "r_x2": 526.006, "r_y2": 141.57100000000003, "r_x3": 508.543, "r_y3": 141.57100000000003, "coord_origin": "TOPLEFT"}, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 56, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 510.447, "r_y0": 90.99699999999996, "r_x1": 523.707, "r_y1": 90.99699999999996, "r_x2": 523.707, "r_y2": 86.28599999999994, "r_x3": 510.447, "r_y3": 86.28599999999994, "coord_origin": "TOPLEFT"}, "text": "145K", "orig": "145K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": [{"id": 46, "label": "text", "bbox": {"l": 119.391, "t": 77.543, "r": 151.946, "b": 83.19600000000003, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 0, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 119.391, "r_y0": 83.19600000000003, "r_x1": 151.946, "r_y1": 83.19600000000003, "r_x2": 151.946, "r_y2": 77.543, "r_x3": 119.391, "r_y3": 77.543, "coord_origin": "TOPLEFT"}, "text": "PubTabNet", "orig": "PubTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 47, "label": "text", "bbox": {"l": 53.346, "t": 75.42399999999998, "r": 59.327, "b": 81.077, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 53.346, "r_y0": 81.077, "r_x1": 59.327, "r_y1": 81.077, "r_x2": 59.327, "r_y2": 75.42399999999998, "r_x3": 53.346, "r_y3": 75.42399999999998, "coord_origin": "TOPLEFT"}, "text": "b.", "orig": "b.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 48, "label": "text", "bbox": {"l": 289.579, "t": 77.69100000000003, "r": 319.827, "b": 83.34400000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 289.579, "r_y0": 83.34400000000005, "r_x1": 319.827, "r_y1": 83.34400000000005, "r_x2": 319.827, "r_y2": 77.69100000000003, "r_x3": 289.579, "r_y3": 77.69100000000003, "coord_origin": "TOPLEFT"}, "text": "FinTabNet", "orig": "FinTabNet", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 49, "label": "text", "bbox": {"l": 448.373, "t": 77.48699999999997, "r": 481.759, "b": 83.13999999999999, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 448.373, "r_y0": 83.13999999999999, "r_x1": 481.759, "r_y1": 83.13999999999999, "r_x2": 481.759, "r_y2": 77.48699999999997, "r_x3": 448.373, "r_y3": 77.48699999999997, "coord_origin": "TOPLEFT"}, "text": "Table Bank", "orig": "Table Bank", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 50, "label": "text", "bbox": {"l": 82.553, "t": 141.47000000000003, "r": 105.08, "b": 146.18100000000004, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 82.553, "r_y0": 146.18100000000004, "r_x1": 105.08, "r_y1": 146.18100000000004, "r_x2": 105.08, "r_y2": 141.47000000000003, "r_x3": 82.553, "r_y3": 141.47000000000003, "coord_origin": "TOPLEFT"}, "text": "Train Val", "orig": "Train Val", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 51, "label": "text", "bbox": {"l": 63.039, "t": 101.298, "r": 85.29, "b": 106.00900000000001, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 63.039, "r_y0": 106.00900000000001, "r_x1": 85.29, "r_y1": 106.00900000000001, "r_x2": 85.29, "r_y2": 101.298, "r_x3": 63.039, "r_y3": 101.298, "coord_origin": "TOPLEFT"}, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 52, "label": "text", "bbox": {"l": 67.768, "t": 124.58900000000006, "r": 85.231, "b": 129.29999999999995, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 67.768, "r_y0": 129.29999999999995, "r_x1": 85.231, "r_y1": 129.29999999999995, "r_x2": 85.231, "r_y2": 124.58900000000006, "r_x3": 67.768, "r_y3": 124.58900000000006, "coord_origin": "TOPLEFT"}, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 53, "label": "text", "bbox": {"l": 227.551, "t": 102.73400000000004, "r": 249.803, "b": 107.44500000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 227.551, "r_y0": 107.44500000000005, "r_x1": 249.803, "r_y1": 107.44500000000005, "r_x2": 249.803, "r_y2": 102.73400000000004, "r_x3": 227.551, "r_y3": 102.73400000000004, "coord_origin": "TOPLEFT"}, "text": "Complex", "orig": "Complex", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 54, "label": "text", "bbox": {"l": 232.199, "t": 127.17999999999995, "r": 249.662, "b": 131.89099999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 232.199, "r_y0": 131.89099999999996, "r_x1": 249.662, "r_y1": 131.89099999999996, "r_x2": 249.662, "r_y2": 127.17999999999995, "r_x3": 232.199, "r_y3": 127.17999999999995, "coord_origin": "TOPLEFT"}, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 55, "label": "text", "bbox": {"l": 396.234, "t": 114.23900000000003, "r": 413.697, "b": 118.95000000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 396.234, "r_y0": 118.95000000000005, "r_x1": 413.697, "r_y1": 118.95000000000005, "r_x2": 413.697, "r_y2": 114.23900000000003, "r_x3": 396.234, "r_y3": 114.23900000000003, "coord_origin": "TOPLEFT"}, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 56, "label": "text", "bbox": {"l": 60.938, "t": 85.92700000000002, "r": 76.151, "b": 90.63800000000003, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 60.938, "r_y0": 90.63800000000003, "r_x1": 76.151, "r_y1": 90.63800000000003, "r_x2": 76.151, "r_y2": 85.92700000000002, "r_x3": 60.938, "r_y3": 85.92700000000002, "coord_origin": "TOPLEFT"}, "text": "100%", "orig": "100%", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 57, "label": "text", "bbox": {"l": 82.305, "t": 86.39599999999996, "r": 106.992, "b": 91.12800000000004, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 82.305, "r_y0": 91.12800000000004, "r_x1": 106.992, "r_y1": 91.10699999999997, "r_x2": 106.992, "r_y2": 86.39599999999996, "r_x3": 82.305, "r_y3": 86.41700000000003, "coord_origin": "TOPLEFT"}, "text": "500K 10K", "orig": "500K 10K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 58, "label": "text", "bbox": {"l": 246.205, "t": 141.79999999999995, "r": 271.386, "b": 146.51099999999997, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 246.205, "r_y0": 146.51099999999997, "r_x1": 271.386, "r_y1": 146.51099999999997, "r_x2": 271.386, "r_y2": 141.79999999999995, "r_x3": 246.205, "r_y3": 141.79999999999995, "coord_origin": "TOPLEFT"}, "text": "Train Test", "orig": "Train Test", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 59, "label": "text", "bbox": {"l": 274.182, "t": 141.79999999999995, "r": 281.88, "b": 146.51099999999997, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 274.182, "r_y0": 146.51099999999997, "r_x1": 281.88, "r_y1": 146.51099999999997, "r_x2": 281.88, "r_y2": 141.79999999999995, "r_x3": 274.182, "r_y3": 141.79999999999995, "coord_origin": "TOPLEFT"}, "text": "Val", "orig": "Val", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 60, "label": "text", "bbox": {"l": 226.698, "t": 85.92700000000002, "r": 241.912, "b": 90.63800000000003, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 14, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 226.698, "r_y0": 90.63800000000003, "r_x1": 241.912, "r_y1": 90.63800000000003, "r_x2": 241.912, "r_y2": 85.92700000000002, "r_x3": 226.698, "r_y3": 85.92700000000002, "coord_origin": "TOPLEFT"}, "text": "100%", "orig": "100%", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 61, "label": "text", "bbox": {"l": 249.939, "t": 86.28200000000004, "r": 282.494, "b": 91.0, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 15, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 249.939, "r_y0": 90.99300000000005, "r_x1": 282.494, "r_y1": 91.0, "r_x2": 282.494, "r_y2": 86.28899999999999, "r_x3": 249.939, "r_y3": 86.28200000000004, "coord_origin": "TOPLEFT"}, "text": "91K 10K10K", "orig": "91K 10K10K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 62, "label": "text", "bbox": {"l": 410.194, "t": 141.47000000000003, "r": 434.278, "b": 146.32799999999997, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 16, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 410.194, "r_y0": 146.18100000000004, "r_x1": 434.278, "r_y1": 146.32799999999997, "r_x2": 434.278, "r_y2": 141.61699999999996, "r_x3": 410.194, "r_y3": 141.47000000000003, "coord_origin": "TOPLEFT"}, "text": "Train Test", "orig": "Train Test", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 63, "label": "text", "bbox": {"l": 436.991, "t": 141.61699999999996, "r": 444.689, "b": 146.32799999999997, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 17, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 436.991, "r_y0": 146.32799999999997, "r_x1": 444.689, "r_y1": 146.32799999999997, "r_x2": 444.689, "r_y2": 141.61699999999996, "r_x3": 436.991, "r_y3": 141.61699999999996, "coord_origin": "TOPLEFT"}, "text": "Val", "orig": "Val", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 64, "label": "text", "bbox": {"l": 391.373, "t": 85.92700000000002, "r": 406.587, "b": 90.63800000000003, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 18, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 391.373, "r_y0": 90.63800000000003, "r_x1": 406.587, "r_y1": 90.63800000000003, "r_x2": 406.587, "r_y2": 85.92700000000002, "r_x3": 391.373, "r_y3": 85.92700000000002, "coord_origin": "TOPLEFT"}, "text": "100%", "orig": "100%", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 65, "label": "text", "bbox": {"l": 410.521, "t": 86.41700000000003, "r": 445.624, "b": 91.16600000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 19, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 410.521, "r_y0": 91.12800000000004, "r_x1": 445.624, "r_y1": 91.16600000000005, "r_x2": 445.624, "r_y2": 86.45500000000004, "r_x3": 410.521, "r_y3": 86.41700000000003, "coord_origin": "TOPLEFT"}, "text": "130K 5K 10K", "orig": "130K 5K 10K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 66, "label": "text", "bbox": {"l": 113.949, "t": 141.48199999999997, "r": 156.042, "b": 146.341, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 20, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 113.949, "r_y0": 146.19299999999998, "r_x1": 156.042, "r_y1": 146.341, "r_x2": 156.042, "r_y2": 141.63, "r_x3": 113.949, "r_y3": 141.48199999999997, "coord_origin": "TOPLEFT"}, "text": "Complex Simple", "orig": "Complex Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 67, "label": "text", "bbox": {"l": 116.916, "t": 95.01199999999994, "r": 127.054, "b": 99.72299999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 21, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 116.916, "r_y0": 99.72299999999996, "r_x1": 127.054, "r_y1": 99.72299999999996, "r_x2": 127.054, "r_y2": 95.01199999999994, "r_x3": 116.916, "r_y3": 95.01199999999994, "coord_origin": "TOPLEFT"}, "text": "Non", "orig": "Non", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 68, "label": "text", "bbox": {"l": 113.315, "t": 101.13199999999995, "r": 127.053, "b": 105.84299999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 22, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 113.315, "r_y0": 105.84299999999996, "r_x1": 127.053, "r_y1": 105.84299999999996, "r_x2": 127.053, "r_y2": 101.13199999999995, "r_x3": 113.315, "r_y3": 101.13199999999995, "coord_origin": "TOPLEFT"}, "text": "Strict", "orig": "Strict", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 69, "label": "text", "bbox": {"l": 112.941, "t": 107.25199999999995, "r": 127.055, "b": 111.96299999999997, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 23, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 112.941, "r_y0": 111.96299999999997, "r_x1": 127.055, "r_y1": 111.96299999999997, "r_x2": 127.055, "r_y2": 107.25199999999995, "r_x3": 112.941, "r_y3": 107.25199999999995, "coord_origin": "TOPLEFT"}, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 70, "label": "text", "bbox": {"l": 113.227, "t": 122.80899999999997, "r": 126.966, "b": 127.51999999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 24, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 113.227, "r_y0": 127.51999999999998, "r_x1": 126.966, "r_y1": 127.51999999999998, "r_x2": 126.966, "r_y2": 122.80899999999997, "r_x3": 113.227, "r_y3": 122.80899999999997, "coord_origin": "TOPLEFT"}, "text": "Strict", "orig": "Strict", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 71, "label": "text", "bbox": {"l": 112.854, "t": 128.92899999999997, "r": 126.968, "b": 133.64, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 25, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 112.854, "r_y0": 133.64, "r_x1": 126.968, "r_y1": 133.64, "r_x2": 126.968, "r_y2": 128.92899999999997, "r_x3": 112.854, "r_y3": 128.92899999999997, "coord_origin": "TOPLEFT"}, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 72, "label": "text", "bbox": {"l": 122.031, "t": 86.46000000000004, "r": 151.042, "b": 91.17600000000004, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 26, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 122.031, "r_y0": 91.17600000000004, "r_x1": 151.042, "r_y1": 91.17100000000005, "r_x2": 151.042, "r_y2": 86.46000000000004, "r_x3": 122.031, "r_y3": 86.46500000000003, "coord_origin": "TOPLEFT"}, "text": "230K 280K", "orig": "230K 280K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 73, "label": "text", "bbox": {"l": 311.654, "t": 86.74900000000002, "r": 321.672, "b": 91.46000000000004, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 27, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 311.654, "r_y0": 91.46000000000004, "r_x1": 321.672, "r_y1": 91.46000000000004, "r_x2": 321.672, "r_y2": 86.74900000000002, "r_x3": 311.654, "r_y3": 86.74900000000002, "coord_origin": "TOPLEFT"}, "text": "65K", "orig": "65K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 74, "label": "text", "bbox": {"l": 287.894, "t": 141.904, "r": 328.809, "b": 146.615, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 28, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 287.894, "r_y0": 146.615, "r_x1": 328.809, "r_y1": 146.615, "r_x2": 328.809, "r_y2": 141.904, "r_x3": 287.894, "r_y3": 141.904, "coord_origin": "TOPLEFT"}, "text": "Complex Simple", "orig": "Complex Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 75, "label": "text", "bbox": {"l": 289.236, "t": 93.274, "r": 299.375, "b": 97.98500000000001, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 29, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 289.236, "r_y0": 97.98500000000001, "r_x1": 299.375, "r_y1": 97.98500000000001, "r_x2": 299.375, "r_y2": 93.274, "r_x3": 289.236, "r_y3": 93.274, "coord_origin": "TOPLEFT"}, "text": "Non", "orig": "Non", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 76, "label": "text", "bbox": {"l": 285.635, "t": 99.394, "r": 299.373, "b": 104.10500000000002, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 30, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 285.635, "r_y0": 104.10500000000002, "r_x1": 299.373, "r_y1": 104.10500000000002, "r_x2": 299.373, "r_y2": 99.394, "r_x3": 285.635, "r_y3": 99.394, "coord_origin": "TOPLEFT"}, "text": "Strict", "orig": "Strict", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 77, "label": "text", "bbox": {"l": 285.261, "t": 105.51400000000001, "r": 299.375, "b": 110.22500000000002, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 31, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 285.261, "r_y0": 110.22500000000002, "r_x1": 299.375, "r_y1": 110.22500000000002, "r_x2": 299.375, "r_y2": 105.51400000000001, "r_x3": 285.261, "r_y3": 105.51400000000001, "coord_origin": "TOPLEFT"}, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 78, "label": "text", "bbox": {"l": 285.431, "t": 120.58399999999995, "r": 299.169, "b": 125.29499999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 32, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 285.431, "r_y0": 125.29499999999996, "r_x1": 299.169, "r_y1": 125.29499999999996, "r_x2": 299.169, "r_y2": 120.58399999999995, "r_x3": 285.431, "r_y3": 120.58399999999995, "coord_origin": "TOPLEFT"}, "text": "Strict", "orig": "Strict", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 79, "label": "text", "bbox": {"l": 285.057, "t": 126.70399999999995, "r": 299.171, "b": 131.41499999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 33, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 285.057, "r_y0": 131.41499999999996, "r_x1": 299.171, "r_y1": 131.41499999999996, "r_x2": 299.171, "r_y2": 126.70399999999995, "r_x3": 285.057, "r_y3": 126.70399999999995, "coord_origin": "TOPLEFT"}, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 80, "label": "text", "bbox": {"l": 299.584, "t": 86.88699999999994, "r": 309.602, "b": 91.59799999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 34, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 299.584, "r_y0": 91.59799999999996, "r_x1": 309.602, "r_y1": 91.59799999999996, "r_x2": 309.602, "r_y2": 86.88699999999994, "r_x3": 299.584, "r_y3": 86.88699999999994, "coord_origin": "TOPLEFT"}, "text": "47K", "orig": "47K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 81, "label": "text", "bbox": {"l": 466.041, "t": 141.86599999999999, "r": 483.504, "b": 146.57600000000002, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 35, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 466.041, "r_y0": 146.57600000000002, "r_x1": 483.504, "r_y1": 146.57600000000002, "r_x2": 483.504, "r_y2": 141.86599999999999, "r_x3": 466.041, "r_y3": 141.86599999999999, "coord_origin": "TOPLEFT"}, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 82, "label": "text", "bbox": {"l": 459.022, "t": 93.95500000000004, "r": 469.16, "b": 98.66600000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 36, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 459.022, "r_y0": 98.66600000000005, "r_x1": 469.16, "r_y1": 98.66600000000005, "r_x2": 469.16, "r_y2": 93.95500000000004, "r_x3": 459.022, "r_y3": 93.95500000000004, "coord_origin": "TOPLEFT"}, "text": "Non", "orig": "Non", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 83, "label": "text", "bbox": {"l": 455.421, "t": 100.07500000000005, "r": 469.159, "b": 104.78599999999994, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 37, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 455.421, "r_y0": 104.78599999999994, "r_x1": 469.159, "r_y1": 104.78599999999994, "r_x2": 469.159, "r_y2": 100.07500000000005, "r_x3": 455.421, "r_y3": 100.07500000000005, "coord_origin": "TOPLEFT"}, "text": "Strict", "orig": "Strict", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 84, "label": "text", "bbox": {"l": 455.047, "t": 106.19500000000005, "r": 469.161, "b": 110.90599999999995, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 38, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 455.047, "r_y0": 110.90599999999995, "r_x1": 469.161, "r_y1": 110.90599999999995, "r_x2": 469.161, "r_y2": 106.19500000000005, "r_x3": 455.047, "r_y3": 106.19500000000005, "coord_origin": "TOPLEFT"}, "text": "HTML", "orig": "HTML", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 85, "label": "text", "bbox": {"l": 467.394, "t": 85.76599999999996, "r": 480.655, "b": 90.47699999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 39, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 467.394, "r_y0": 90.47699999999998, "r_x1": 480.655, "r_y1": 90.47699999999998, "r_x2": 480.655, "r_y2": 85.76599999999996, "r_x3": 467.394, "r_y3": 85.76599999999996, "coord_origin": "TOPLEFT"}, "text": "145K", "orig": "145K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 86, "label": "text", "bbox": {"l": 160.377, "t": 141.77800000000002, "r": 202.841, "b": 146.61599999999999, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 40, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.377, "r_y0": 146.48900000000003, "r_x1": 202.841, "r_y1": 146.61599999999999, "r_x2": 202.841, "r_y2": 141.90499999999997, "r_x3": 160.377, "r_y3": 141.77800000000002, "coord_origin": "TOPLEFT"}, "text": "Complex Simple", "orig": "Complex Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 87, "label": "text", "bbox": {"l": 153.743, "t": 95.05899999999997, "r": 173.327, "b": 99.76999999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 41, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 153.743, "r_y0": 99.76999999999998, "r_x1": 173.327, "r_y1": 99.76999999999998, "r_x2": 173.327, "r_y2": 95.05899999999997, "r_x3": 153.743, "r_y3": 95.05899999999997, "coord_origin": "TOPLEFT"}, "text": "Contain", "orig": "Contain", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 88, "label": "text", "bbox": {"l": 154.51, "t": 101.17899999999997, "r": 173.325, "b": 105.88999999999999, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 42, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 154.51, "r_y0": 105.88999999999999, "r_x1": 173.325, "r_y1": 105.88999999999999, "r_x2": 173.325, "r_y2": 101.17899999999997, "r_x3": 154.51, "r_y3": 101.17899999999997, "coord_origin": "TOPLEFT"}, "text": "Missing", "orig": "Missing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 89, "label": "text", "bbox": {"l": 155.272, "t": 107.29899999999998, "r": 173.327, "b": 112.00999999999999, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 43, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 155.272, "r_y0": 112.00999999999999, "r_x1": 173.327, "r_y1": 112.00999999999999, "r_x2": 173.327, "r_y2": 107.29899999999998, "r_x3": 155.272, "r_y3": 107.29899999999998, "coord_origin": "TOPLEFT"}, "text": "bboxes", "orig": "bboxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 90, "label": "text", "bbox": {"l": 326.413, "t": 107.42600000000004, "r": 345.997, "b": 112.13699999999994, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 44, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 326.413, "r_y0": 112.13699999999994, "r_x1": 345.997, "r_y1": 112.13699999999994, "r_x2": 345.997, "r_y2": 107.42600000000004, "r_x3": 326.413, "r_y3": 107.42600000000004, "coord_origin": "TOPLEFT"}, "text": "Contain", "orig": "Contain", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 91, "label": "text", "bbox": {"l": 327.18, "t": 113.54600000000005, "r": 345.995, "b": 118.25699999999995, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 45, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 327.18, "r_y0": 118.25699999999995, "r_x1": 345.995, "r_y1": 118.25699999999995, "r_x2": 345.995, "r_y2": 113.54600000000005, "r_x3": 327.18, "r_y3": 113.54600000000005, "coord_origin": "TOPLEFT"}, "text": "Missing", "orig": "Missing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 92, "label": "text", "bbox": {"l": 327.941, "t": 119.66600000000005, "r": 345.996, "b": 124.37699999999995, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 46, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 327.941, "r_y0": 124.37699999999995, "r_x1": 345.996, "r_y1": 124.37699999999995, "r_x2": 345.996, "r_y2": 119.66600000000005, "r_x3": 327.941, "r_y3": 119.66600000000005, "coord_origin": "TOPLEFT"}, "text": "bboxes", "orig": "bboxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 93, "label": "text", "bbox": {"l": 488.994, "t": 104.34799999999996, "r": 508.764, "b": 109.05899999999997, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 47, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 488.994, "r_y0": 109.05899999999997, "r_x1": 508.764, "r_y1": 109.05899999999997, "r_x2": 508.764, "r_y2": 104.34799999999996, "r_x3": 488.994, "r_y3": 104.34799999999996, "coord_origin": "TOPLEFT"}, "text": "Dataset", "orig": "Dataset", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 94, "label": "text", "bbox": {"l": 490.189, "t": 110.46799999999996, "r": 508.764, "b": 115.17899999999997, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 48, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 490.189, "r_y0": 115.17899999999997, "r_x1": 508.764, "r_y1": 115.17899999999997, "r_x2": 508.764, "r_y2": 110.46799999999996, "r_x3": 490.189, "r_y3": 110.46799999999996, "coord_origin": "TOPLEFT"}, "text": "doesn't", "orig": "doesn't", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 95, "label": "text", "bbox": {"l": 489.72, "t": 116.58799999999997, "r": 508.768, "b": 121.29899999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 49, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 489.72, "r_y0": 121.29899999999998, "r_x1": 508.768, "r_y1": 121.29899999999998, "r_x2": 508.768, "r_y2": 116.58799999999997, "r_x3": 489.72, "r_y3": 116.58799999999997, "coord_origin": "TOPLEFT"}, "text": "provide", "orig": "provide", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 96, "label": "text", "bbox": {"l": 490.711, "t": 122.70799999999997, "r": 508.766, "b": 127.41899999999998, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 50, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 490.711, "r_y0": 127.41899999999998, "r_x1": 508.766, "r_y1": 127.41899999999998, "r_x2": 508.766, "r_y2": 122.70799999999997, "r_x3": 490.711, "r_y3": 122.70799999999997, "coord_origin": "TOPLEFT"}, "text": "bboxes", "orig": "bboxes", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 97, "label": "text", "bbox": {"l": 168.504, "t": 86.28899999999999, "r": 197.527, "b": 91.04100000000005, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 51, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 168.504, "r_y0": 91.04100000000005, "r_x1": 197.527, "r_y1": 91.0, "r_x2": 197.527, "r_y2": 86.28899999999999, "r_x3": 168.504, "r_y3": 86.33000000000004, "coord_origin": "TOPLEFT"}, "text": "230K 280K", "orig": "230K 280K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 98, "label": "text", "bbox": {"l": 357.377, "t": 86.19100000000003, "r": 367.395, "b": 90.90200000000004, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 52, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 357.377, "r_y0": 90.90200000000004, "r_x1": 367.395, "r_y1": 90.90200000000004, "r_x2": 367.395, "r_y2": 86.19100000000003, "r_x3": 357.377, "r_y3": 86.19100000000003, "coord_origin": "TOPLEFT"}, "text": "65K", "orig": "65K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 99, "label": "text", "bbox": {"l": 333.732, "t": 141.817, "r": 374.929, "b": 146.52800000000002, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 53, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 333.732, "r_y0": 146.52800000000002, "r_x1": 374.929, "r_y1": 146.52800000000002, "r_x2": 374.929, "r_y2": 141.817, "r_x3": 333.732, "r_y3": 141.817, "coord_origin": "TOPLEFT"}, "text": "Complex Simple", "orig": "Complex Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 100, "label": "text", "bbox": {"l": 345.691, "t": 86.25, "r": 355.709, "b": 90.96100000000001, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 54, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 345.691, "r_y0": 90.96100000000001, "r_x1": 355.709, "r_y1": 90.96100000000001, "r_x2": 355.709, "r_y2": 86.25, "r_x3": 345.691, "r_y3": 86.25, "coord_origin": "TOPLEFT"}, "text": "47K", "orig": "47K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 101, "label": "text", "bbox": {"l": 508.543, "t": 141.57100000000003, "r": 526.006, "b": 146.28200000000004, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 55, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 508.543, "r_y0": 146.28200000000004, "r_x1": 526.006, "r_y1": 146.28200000000004, "r_x2": 526.006, "r_y2": 141.57100000000003, "r_x3": 508.543, "r_y3": 141.57100000000003, "coord_origin": "TOPLEFT"}, "text": "Simple", "orig": "Simple", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 102, "label": "text", "bbox": {"l": 510.447, "t": 86.28599999999994, "r": 523.707, "b": 90.99699999999996, "coord_origin": "TOPLEFT"}, "confidence": 1.0, "cells": [{"index": 56, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 510.447, "r_y0": 90.99699999999996, "r_x1": 523.707, "r_y1": 90.99699999999996, "r_x2": 523.707, "r_y2": 86.28599999999994, "r_x3": 510.447, "r_y3": 86.28599999999994, "coord_origin": "TOPLEFT"}, "text": "145K", "orig": "145K", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}]}, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null}, {"label": "caption", "id": 1, "page_no": 11, "cluster": {"id": 1, "label": "caption", "bbox": {"l": 50.112, "t": 165.77099999999996, "r": 545.114, "b": 186.27800000000002, "coord_origin": "TOPLEFT"}, "confidence": 0.9661495685577393, "cells": [{"index": 57, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 174.32299999999998, "r_x1": 86.585, "r_y1": 174.32299999999998, "r_x2": 86.585, "r_y2": 165.77099999999996, "r_x3": 50.112, "r_y3": 165.77099999999996, "coord_origin": "TOPLEFT"}, "text": "Figure 7:", "orig": "Figure 7:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 58, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 92.832, "r_y0": 174.32299999999998, "r_x1": 545.114, "r_y1": 174.32299999999998, "r_x2": 545.114, "r_y2": 165.77099999999996, "r_x3": 92.832, "r_y3": 165.77099999999996, "coord_origin": "TOPLEFT"}, "text": "Distribution of the tables across different dimensions per dataset. Simple vs complex tables per dataset and split,", "orig": "Distribution of the tables across different dimensions per dataset. Simple vs complex tables per dataset and split,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 59, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 186.27800000000002, "r_x1": 513.522, "r_y1": 186.27800000000002, "r_x2": 513.522, "r_y2": 177.726, "r_x3": 50.112, "r_y3": 177.726, "coord_origin": "TOPLEFT"}, "text": "strict vs non strict html structures per dataset and table complexity, missing bboxes per dataset and table complexity.", "orig": "strict vs non strict html structures per dataset and table complexity, missing bboxes per dataset and table complexity.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Figure 7: Distribution of the tables across different dimensions per dataset. Simple vs complex tables per dataset and split, strict vs non strict html structures per dataset and table complexity, missing bboxes per dataset and table complexity."}, {"label": "list_item", "id": 4, "page_no": 11, "cluster": {"id": 4, "label": "list_item", "bbox": {"l": 61.569, "t": 211.20000000000005, "r": 286.365, "b": 231.707, "coord_origin": "TOPLEFT"}, "confidence": 0.9621952772140503, "cells": [{"index": 60, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 61.569, "r_y0": 219.75199999999995, "r_x1": 65.056, "r_y1": 219.75199999999995, "r_x2": 65.056, "r_y2": 211.20000000000005, "r_x3": 61.569, "r_y3": 211.20000000000005, "coord_origin": "TOPLEFT"}, "text": "\u2022", "orig": "\u2022", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 61, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.037, "r_y0": 219.75199999999995, "r_x1": 286.365, "r_y1": 219.75199999999995, "r_x2": 286.365, "r_y2": 211.20000000000005, "r_x3": 70.037, "r_y3": 211.20000000000005, "coord_origin": "TOPLEFT"}, "text": "TableFormer output does not include the table cell con-", "orig": "TableFormer output does not include the table cell con-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 62, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.037, "r_y0": 231.707, "r_x1": 87.472, "r_y1": 231.707, "r_x2": 87.472, "r_y2": 223.15499999999997, "r_x3": 70.037, "r_y3": 223.15499999999997, "coord_origin": "TOPLEFT"}, "text": "tent.", "orig": "tent.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "\u00b7 TableFormer output does not include the table cell content."}, {"label": "list_item", "id": 3, "page_no": 11, "cluster": {"id": 3, "label": "list_item", "bbox": {"l": 61.569, "t": 244.34000000000003, "r": 286.365, "b": 264.847, "coord_origin": "TOPLEFT"}, "confidence": 0.9629555344581604, "cells": [{"index": 63, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 61.569, "r_y0": 252.89200000000005, "r_x1": 65.056, "r_y1": 252.89200000000005, "r_x2": 65.056, "r_y2": 244.34000000000003, "r_x3": 61.569, "r_y3": 244.34000000000003, "coord_origin": "TOPLEFT"}, "text": "\u2022", "orig": "\u2022", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 64, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.037, "r_y0": 252.89200000000005, "r_x1": 286.365, "r_y1": 252.89200000000005, "r_x2": 286.365, "r_y2": 244.34000000000003, "r_x3": 70.037, "r_y3": 244.34000000000003, "coord_origin": "TOPLEFT"}, "text": "There are occasional inaccuracies in the predictions of", "orig": "There are occasional inaccuracies in the predictions of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 65, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 70.037, "r_y0": 264.847, "r_x1": 150.415, "r_y1": 264.847, "r_x2": 150.415, "r_y2": 256.29499999999996, "r_x3": 70.037, "r_y3": 256.29499999999996, "coord_origin": "TOPLEFT"}, "text": "the bounding boxes.", "orig": "the bounding boxes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "\u00b7 There are occasional inaccuracies in the predictions of the bounding boxes."}, {"label": "text", "id": 0, "page_no": 11, "cluster": {"id": 0, "label": "text", "bbox": {"l": 50.112, "t": 279.472, "r": 286.365, "b": 395.621, "coord_origin": "TOPLEFT"}, "confidence": 0.9767085909843445, "cells": [{"index": 66, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 288.024, "r_x1": 286.365, "r_y1": 288.024, "r_x2": 286.365, "r_y2": 279.472, "r_x3": 62.067, "r_y3": 279.472, "coord_origin": "TOPLEFT"}, "text": "However, it is possible to mitigate those limitations by", "orig": "However, it is possible to mitigate those limitations by", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 67, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 299.979, "r_x1": 286.365, "r_y1": 299.979, "r_x2": 286.365, "r_y2": 291.427, "r_x3": 50.112, "r_y3": 291.427, "coord_origin": "TOPLEFT"}, "text": "combining the TableFormer predictions with the informa-", "orig": "combining the TableFormer predictions with the informa-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 68, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 311.934, "r_x1": 286.365, "r_y1": 311.934, "r_x2": 286.365, "r_y2": 303.382, "r_x3": 50.112, "r_y3": 303.382, "coord_origin": "TOPLEFT"}, "text": "tion already present inside a programmatic PDF document.", "orig": "tion already present inside a programmatic PDF document.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 69, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 323.889, "r_x1": 123.387, "r_y1": 323.889, "r_x2": 123.387, "r_y2": 315.337, "r_x3": 50.112, "r_y3": 315.337, "coord_origin": "TOPLEFT"}, "text": "More specifically,", "orig": "More specifically,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 70, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 128.348, "r_y0": 323.889, "r_x1": 286.365, "r_y1": 323.889, "r_x2": 286.365, "r_y2": 315.337, "r_x3": 128.348, "r_y3": 315.337, "coord_origin": "TOPLEFT"}, "text": "PDF documents can be seen as a se-", "orig": "PDF documents can be seen as a se-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 71, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 335.845, "r_x1": 286.365, "r_y1": 335.845, "r_x2": 286.365, "r_y2": 327.293, "r_x3": 50.112, "r_y3": 327.293, "coord_origin": "TOPLEFT"}, "text": "quence of PDF cells where each cell is described by its con-", "orig": "quence of PDF cells where each cell is described by its con-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 72, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 347.8, "r_x1": 286.365, "r_y1": 347.8, "r_x2": 286.365, "r_y2": 339.248, "r_x3": 50.112, "r_y3": 339.248, "coord_origin": "TOPLEFT"}, "text": "tent and bounding box. If we are able to associate the PDF", "orig": "tent and bounding box. If we are able to associate the PDF", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 73, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 359.755, "r_x1": 286.365, "r_y1": 359.755, "r_x2": 286.365, "r_y2": 351.203, "r_x3": 50.112, "r_y3": 351.203, "coord_origin": "TOPLEFT"}, "text": "cells with the predicted table cells, we can directly link the", "orig": "cells with the predicted table cells, we can directly link the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 74, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 371.71, "r_x1": 286.365, "r_y1": 371.71, "r_x2": 286.365, "r_y2": 363.158, "r_x3": 50.112, "r_y3": 363.158, "coord_origin": "TOPLEFT"}, "text": "PDF cell content to the table cell structure and use the PDF", "orig": "PDF cell content to the table cell structure and use the PDF", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 75, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 383.665, "r_x1": 286.365, "r_y1": 383.665, "r_x2": 286.365, "r_y2": 375.113, "r_x3": 50.112, "r_y3": 375.113, "coord_origin": "TOPLEFT"}, "text": "bounding boxes to correct misalignments in the predicted", "orig": "bounding boxes to correct misalignments in the predicted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 76, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 395.621, "r_x1": 154.56, "r_y1": 395.621, "r_x2": 154.56, "r_y2": 387.069, "r_x3": 50.112, "r_y3": 387.069, "coord_origin": "TOPLEFT"}, "text": "table cell bounding boxes.", "orig": "table cell bounding boxes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "However, it is possible to mitigate those limitations by combining the TableFormer predictions with the information already present inside a programmatic PDF document. More specifically, PDF documents can be seen as a sequence of PDF cells where each cell is described by its content and bounding box. If we are able to associate the PDF cells with the predicted table cells, we can directly link the PDF cell content to the table cell structure and use the PDF bounding boxes to correct misalignments in the predicted table cell bounding boxes."}, {"label": "text", "id": 11, "page_no": 11, "cluster": {"id": 11, "label": "text", "bbox": {"l": 50.112, "t": 399.338, "r": 286.365, "b": 419.846, "coord_origin": "TOPLEFT"}, "confidence": 0.934766411781311, "cells": [{"index": 77, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 407.89, "r_x1": 286.365, "r_y1": 407.89, "r_x2": 286.365, "r_y2": 399.338, "r_x3": 62.067, "r_y3": 399.338, "coord_origin": "TOPLEFT"}, "text": "Here is a step-by-step description of the prediction post-", "orig": "Here is a step-by-step description of the prediction post-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 78, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 419.846, "r_x1": 95.492, "r_y1": 419.846, "r_x2": 95.492, "r_y2": 411.294, "r_x3": 50.112, "r_y3": 411.294, "coord_origin": "TOPLEFT"}, "text": "processing:", "orig": "processing:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Here is a step-by-step description of the prediction postprocessing:"}, {"label": "list_item", "id": 20, "page_no": 11, "cluster": {"id": 20, "label": "list_item", "bbox": {"l": 50.112, "t": 423.564, "r": 286.365, "b": 456.026, "coord_origin": "TOPLEFT"}, "confidence": 0.8280702233314514, "cells": [{"index": 79, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 432.116, "r_x1": 286.365, "r_y1": 432.116, "r_x2": 286.365, "r_y2": 423.564, "r_x3": 62.067, "r_y3": 423.564, "coord_origin": "TOPLEFT"}, "text": "1. Get the minimal grid dimensions - number of rows and", "orig": "1. Get the minimal grid dimensions - number of rows and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 80, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 444.071, "r_x1": 218.779, "r_y1": 444.071, "r_x2": 218.779, "r_y2": 435.519, "r_x3": 50.112, "r_y3": 435.519, "coord_origin": "TOPLEFT"}, "text": "columns for the predicted table structure.", "orig": "columns for the predicted table structure.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 81, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 224.796, "r_y0": 444.071, "r_x1": 286.365, "r_y1": 444.071, "r_x2": 286.365, "r_y2": 435.519, "r_x3": 224.796, "r_y3": 435.519, "coord_origin": "TOPLEFT"}, "text": "This represents", "orig": "This represents", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 82, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 456.026, "r_x1": 274.51, "r_y1": 456.026, "r_x2": 274.51, "r_y2": 447.474, "r_x3": 50.112, "r_y3": 447.474, "coord_origin": "TOPLEFT"}, "text": "the most granular grid for the underlying table structure.", "orig": "the most granular grid for the underlying table structure.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "1. Get the minimal grid dimensions - number of rows and columns for the predicted table structure. This represents the most granular grid for the underlying table structure."}, {"label": "list_item", "id": 2, "page_no": 11, "cluster": {"id": 2, "label": "list_item", "bbox": {"l": 50.112, "t": 459.744, "r": 286.365, "b": 504.161, "coord_origin": "TOPLEFT"}, "confidence": 0.9646760821342468, "cells": [{"index": 83, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 468.296, "r_x1": 69.539, "r_y1": 468.296, "r_x2": 69.539, "r_y2": 459.744, "r_x3": 62.067, "r_y3": 459.744, "coord_origin": "TOPLEFT"}, "text": "2.", "orig": "2.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 84, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 77.429, "r_y0": 468.296, "r_x1": 286.365, "r_y1": 468.296, "r_x2": 286.365, "r_y2": 459.744, "r_x3": 77.429, "r_y3": 459.744, "coord_origin": "TOPLEFT"}, "text": "Generate pair-wise matches between the bounding", "orig": "Generate pair-wise matches between the bounding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 85, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 480.251, "r_x1": 286.365, "r_y1": 480.251, "r_x2": 286.365, "r_y2": 471.699, "r_x3": 50.112, "r_y3": 471.699, "coord_origin": "TOPLEFT"}, "text": "boxes of the PDF cells and the predicted cells. The Intersec-", "orig": "boxes of the PDF cells and the predicted cells. The Intersec-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 86, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 492.206, "r_x1": 286.365, "r_y1": 492.206, "r_x2": 286.365, "r_y2": 483.654, "r_x3": 50.112, "r_y3": 483.654, "coord_origin": "TOPLEFT"}, "text": "tion Over Union (IOU) metric is used to evaluate the quality", "orig": "tion Over Union (IOU) metric is used to evaluate the quality", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 87, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 504.161, "r_x1": 110.705, "r_y1": 504.161, "r_x2": 110.705, "r_y2": 495.609, "r_x3": 50.112, "r_y3": 495.609, "coord_origin": "TOPLEFT"}, "text": "of the matches.", "orig": "of the matches.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "2. Generate pair-wise matches between the bounding boxes of the PDF cells and the predicted cells. The Intersection Over Union (IOU) metric is used to evaluate the quality of the matches."}, {"label": "list_item", "id": 10, "page_no": 11, "cluster": {"id": 10, "label": "list_item", "bbox": {"l": 50.112, "t": 507.879, "r": 286.365, "b": 528.387, "coord_origin": "TOPLEFT"}, "confidence": 0.9391399025917053, "cells": [{"index": 88, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 516.431, "r_x1": 69.539, "r_y1": 516.431, "r_x2": 69.539, "r_y2": 507.879, "r_x3": 62.067, "r_y3": 507.879, "coord_origin": "TOPLEFT"}, "text": "3.", "orig": "3.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 89, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 75.248, "r_y0": 516.431, "r_x1": 286.365, "r_y1": 516.431, "r_x2": 286.365, "r_y2": 507.879, "r_x3": 75.248, "r_y3": 507.879, "coord_origin": "TOPLEFT"}, "text": "Use a carefully selected IOU threshold to designate", "orig": "Use a carefully selected IOU threshold to designate", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 90, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 528.387, "r_x1": 226.071, "r_y1": 528.387, "r_x2": 226.071, "r_y2": 519.835, "r_x3": 50.112, "r_y3": 519.835, "coord_origin": "TOPLEFT"}, "text": "the matches as 'good' ones and 'bad' ones.", "orig": "the matches as 'good' ones and 'bad' ones.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "3. Use a carefully selected IOU threshold to designate the matches as 'good' ones and 'bad' ones."}, {"label": "list_item", "id": 8, "page_no": 11, "cluster": {"id": 8, "label": "list_item", "bbox": {"l": 50.112, "t": 532.104, "r": 286.365, "b": 564.567, "coord_origin": "TOPLEFT"}, "confidence": 0.9491708874702454, "cells": [{"index": 91, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 540.656, "r_x1": 76.453, "r_y1": 540.656, "r_x2": 76.453, "r_y2": 532.104, "r_x3": 62.067, "r_y3": 532.104, "coord_origin": "TOPLEFT"}, "text": "3.a.", "orig": "3.a.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 92, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 80.587, "r_y0": 540.656, "r_x1": 286.365, "r_y1": 540.656, "r_x2": 286.365, "r_y2": 532.104, "r_x3": 80.587, "r_y3": 532.104, "coord_origin": "TOPLEFT"}, "text": "If all IOU scores in a column are below the thresh-", "orig": "If all IOU scores in a column are below the thresh-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 93, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 552.612, "r_x1": 286.365, "r_y1": 552.612, "r_x2": 286.365, "r_y2": 544.06, "r_x3": 50.112, "r_y3": 544.06, "coord_origin": "TOPLEFT"}, "text": "old, discard all predictions (structure and bounding boxes)", "orig": "old, discard all predictions (structure and bounding boxes)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 94, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 564.567, "r_x1": 114.032, "r_y1": 564.567, "r_x2": 114.032, "r_y2": 556.015, "r_x3": 50.112, "r_y3": 556.015, "coord_origin": "TOPLEFT"}, "text": "for that column.", "orig": "for that column.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "3.a. If all IOU scores in a column are below the threshold, discard all predictions (structure and bounding boxes) for that column."}, {"label": "list_item", "id": 5, "page_no": 11, "cluster": {"id": 5, "label": "list_item", "bbox": {"l": 50.112, "t": 568.285, "r": 286.365, "b": 600.7470000000001, "coord_origin": "TOPLEFT"}, "confidence": 0.9587163329124451, "cells": [{"index": 95, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 576.837, "r_x1": 69.539, "r_y1": 576.837, "r_x2": 69.539, "r_y2": 568.285, "r_x3": 62.067, "r_y3": 568.285, "coord_origin": "TOPLEFT"}, "text": "4.", "orig": "4.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 96, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 76.732, "r_y0": 576.837, "r_x1": 286.365, "r_y1": 576.837, "r_x2": 286.365, "r_y2": 568.285, "r_x3": 76.732, "r_y3": 568.285, "coord_origin": "TOPLEFT"}, "text": "Find the best-fitting content alignment for the pre-", "orig": "Find the best-fitting content alignment for the pre-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 97, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 588.792, "r_x1": 286.365, "r_y1": 588.792, "r_x2": 286.365, "r_y2": 580.24, "r_x3": 50.112, "r_y3": 580.24, "coord_origin": "TOPLEFT"}, "text": "dicted cells with good IOU per each column. The alignment", "orig": "dicted cells with good IOU per each column. The alignment", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 98, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 600.7470000000001, "r_x1": 278.704, "r_y1": 600.7470000000001, "r_x2": 278.704, "r_y2": 592.1949999999999, "r_x3": 50.112, "r_y3": 592.1949999999999, "coord_origin": "TOPLEFT"}, "text": "of the column can be identified by the following formula:", "orig": "of the column can be identified by the following formula:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "4. Find the best-fitting content alignment for the predicted cells with good IOU per each column. The alignment of the column can be identified by the following formula:"}, {"label": "formula", "id": 12, "page_no": 11, "cluster": {"id": 12, "label": "formula", "bbox": {"l": 110.705, "t": 624.104, "r": 286.362, "b": 654.998, "coord_origin": "TOPLEFT"}, "confidence": 0.9298412799835205, "cells": [{"index": 99, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 112.028, "r_y0": 632.81, "r_x1": 157.952, "r_y1": 632.81, "r_x2": 157.952, "r_y2": 624.104, "r_x3": 112.028, "r_y3": 624.104, "coord_origin": "TOPLEFT"}, "text": "alignment", "orig": "alignment", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 100, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 160.715, "r_y0": 632.81, "r_x1": 203.496, "r_y1": 632.81, "r_x2": 203.496, "r_y2": 624.104, "r_x3": 160.715, "r_y3": 624.104, "coord_origin": "TOPLEFT"}, "text": "= arg min", "orig": "= arg min", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 101, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 185.585, "r_y0": 640.154, "r_x1": 189.145, "r_y1": 640.154, "r_x2": 189.145, "r_y2": 634.06, "r_x3": 185.585, "r_y3": 634.06, "coord_origin": "TOPLEFT"}, "text": "c", "orig": "c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 102, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 203.499, "r_y0": 632.668, "r_x1": 208.48, "r_y1": 632.668, "r_x2": 208.48, "r_y2": 624.104, "r_x3": 203.499, "r_y3": 624.104, "coord_origin": "TOPLEFT"}, "text": "{", "orig": "{", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 103, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 208.481, "r_y0": 632.81, "r_x1": 216.729, "r_y1": 632.81, "r_x2": 216.729, "r_y2": 624.104, "r_x3": 208.481, "r_y3": 624.104, "coord_origin": "TOPLEFT"}, "text": "D", "orig": "D", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 104, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 216.729, "r_y0": 633.734, "r_x1": 220.289, "r_y1": 633.734, "r_x2": 220.289, "r_y2": 627.64, "r_x3": 216.729, "r_y3": 627.64, "coord_origin": "TOPLEFT"}, "text": "c", "orig": "c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 105, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 220.787, "r_y0": 632.668, "r_x1": 225.768, "r_y1": 632.668, "r_x2": 225.768, "r_y2": 624.104, "r_x3": 220.787, "r_y3": 624.104, "coord_origin": "TOPLEFT"}, "text": "}", "orig": "}", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 106, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 110.705, "r_y0": 654.075, "r_x1": 118.953, "r_y1": 654.075, "r_x2": 118.953, "r_y2": 645.369, "r_x3": 110.705, "r_y3": 645.369, "coord_origin": "TOPLEFT"}, "text": "D", "orig": "D", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 107, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 118.953, "r_y0": 654.998, "r_x1": 122.513, "r_y1": 654.998, "r_x2": 122.513, "r_y2": 648.904, "r_x3": 118.953, "r_y3": 648.904, "coord_origin": "TOPLEFT"}, "text": "c", "orig": "c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 108, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 125.779, "r_y0": 654.075, "r_x1": 133.528, "r_y1": 654.075, "r_x2": 133.528, "r_y2": 645.369, "r_x3": 125.779, "r_y3": 645.369, "coord_origin": "TOPLEFT"}, "text": "=", "orig": "=", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 109, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 136.295, "r_y0": 654.075, "r_x1": 166.678, "r_y1": 654.075, "r_x2": 166.678, "r_y2": 645.369, "r_x3": 136.295, "r_y3": 645.369, "coord_origin": "TOPLEFT"}, "text": "max x", "orig": "max x", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 110, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 156.003, "r_y0": 653.933, "r_x1": 160.984, "r_y1": 653.933, "r_x2": 160.984, "r_y2": 645.369, "r_x3": 156.003, "r_y3": 645.369, "coord_origin": "TOPLEFT"}, "text": "{", "orig": "{", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 111, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 166.678, "r_y0": 654.998, "r_x1": 170.238, "r_y1": 654.998, "r_x2": 170.238, "r_y2": 648.904, "r_x3": 166.678, "r_y3": 648.904, "coord_origin": "TOPLEFT"}, "text": "c", "orig": "c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 112, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 170.736, "r_y0": 653.933, "r_x1": 185.678, "r_y1": 653.933, "r_x2": 185.678, "r_y2": 645.369, "r_x3": 170.736, "r_y3": 645.369, "coord_origin": "TOPLEFT"}, "text": "} -", "orig": "} -", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 113, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 187.894, "r_y0": 654.075, "r_x1": 216.729, "r_y1": 654.075, "r_x2": 216.729, "r_y2": 645.369, "r_x3": 187.894, "r_y3": 645.369, "coord_origin": "TOPLEFT"}, "text": "min x", "orig": "min x", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 114, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 206.054, "r_y0": 653.933, "r_x1": 211.035, "r_y1": 653.933, "r_x2": 211.035, "r_y2": 645.369, "r_x3": 206.054, "r_y3": 645.369, "coord_origin": "TOPLEFT"}, "text": "{", "orig": "{", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 115, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 216.729, "r_y0": 654.998, "r_x1": 220.289, "r_y1": 654.998, "r_x2": 220.289, "r_y2": 648.904, "r_x3": 216.729, "r_y3": 648.904, "coord_origin": "TOPLEFT"}, "text": "c", "orig": "c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 116, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 220.787, "r_y0": 653.933, "r_x1": 225.768, "r_y1": 653.933, "r_x2": 225.768, "r_y2": 645.369, "r_x3": 220.787, "r_y3": 645.369, "coord_origin": "TOPLEFT"}, "text": "}", "orig": "}", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 117, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 274.746, "r_y0": 643.706, "r_x1": 286.362, "r_y1": 643.706, "r_x2": 286.362, "r_y2": 635.154, "r_x3": 274.746, "r_y3": 635.154, "coord_origin": "TOPLEFT"}, "text": "(4)", "orig": "(4)", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "alignment = arg min c { D c } D c = max x { c } -min x { c } (4)"}, {"label": "text", "id": 7, "page_no": 11, "cluster": {"id": 7, "label": "text", "bbox": {"l": 50.112, "t": 668.016, "r": 286.362, "b": 688.841, "coord_origin": "TOPLEFT"}, "confidence": 0.9545555114746094, "cells": [{"index": 118, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 676.886, "r_x1": 74.451, "r_y1": 676.886, "r_x2": 74.451, "r_y2": 668.3340000000001, "r_x3": 50.112, "r_y3": 668.3340000000001, "coord_origin": "TOPLEFT"}, "text": "where", "orig": "where", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 119, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 78.336, "r_y0": 676.722, "r_x1": 82.648, "r_y1": 676.722, "r_x2": 82.648, "r_y2": 668.016, "r_x3": 78.336, "r_y3": 668.016, "coord_origin": "TOPLEFT"}, "text": "c", "orig": "c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 120, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 86.533, "r_y0": 676.886, "r_x1": 93.178, "r_y1": 676.886, "r_x2": 93.178, "r_y2": 668.3340000000001, "r_x3": 86.533, "r_y3": 668.3340000000001, "coord_origin": "TOPLEFT"}, "text": "is", "orig": "is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 121, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 97.063, "r_y0": 676.886, "r_x1": 123.634, "r_y1": 676.886, "r_x2": 123.634, "r_y2": 668.3340000000001, "r_x3": 97.063, "r_y3": 668.3340000000001, "coord_origin": "TOPLEFT"}, "text": "one of", "orig": "one of", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 122, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 127.519, "r_y0": 676.58, "r_x1": 132.5, "r_y1": 676.58, "r_x2": 132.5, "r_y2": 668.016, "r_x3": 127.519, "r_y3": 668.016, "coord_origin": "TOPLEFT"}, "text": "{", "orig": "{", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 123, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 132.501, "r_y0": 676.886, "r_x1": 148.272, "r_y1": 676.886, "r_x2": 148.272, "r_y2": 668.3340000000001, "r_x3": 132.501, "r_y3": 668.3340000000001, "coord_origin": "TOPLEFT"}, "text": "left,", "orig": "left,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 124, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 152.506, "r_y0": 676.886, "r_x1": 187.644, "r_y1": 676.886, "r_x2": 187.644, "r_y2": 668.3340000000001, "r_x3": 152.506, "r_y3": 668.3340000000001, "coord_origin": "TOPLEFT"}, "text": "centroid,", "orig": "centroid,", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 125, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 191.878, "r_y0": 676.886, "r_x1": 210.697, "r_y1": 676.886, "r_x2": 210.697, "r_y2": 668.3340000000001, "r_x3": 191.878, "r_y3": 668.3340000000001, "coord_origin": "TOPLEFT"}, "text": "right", "orig": "right", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 126, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 210.697, "r_y0": 676.58, "r_x1": 215.678, "r_y1": 676.58, "r_x2": 215.678, "r_y2": 668.016, "r_x3": 210.697, "r_y3": 668.016, "coord_origin": "TOPLEFT"}, "text": "}", "orig": "}", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 127, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 219.563, "r_y0": 676.886, "r_x1": 233.949, "r_y1": 676.886, "r_x2": 233.949, "r_y2": 668.3340000000001, "r_x3": 219.563, "r_y3": 668.3340000000001, "coord_origin": "TOPLEFT"}, "text": "and", "orig": "and", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 128, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 237.835, "r_y0": 676.722, "r_x1": 243.529, "r_y1": 676.722, "r_x2": 243.529, "r_y2": 668.016, "r_x3": 237.835, "r_y3": 668.016, "coord_origin": "TOPLEFT"}, "text": "x", "orig": "x", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 129, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 243.529, "r_y0": 677.645, "r_x1": 247.089, "r_y1": 677.645, "r_x2": 247.089, "r_y2": 671.551, "r_x3": 243.529, "r_y3": 671.551, "coord_origin": "TOPLEFT"}, "text": "c", "orig": "c", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 130, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 251.473, "r_y0": 676.886, "r_x1": 258.118, "r_y1": 676.886, "r_x2": 258.118, "r_y2": 668.3340000000001, "r_x3": 251.473, "r_y3": 668.3340000000001, "coord_origin": "TOPLEFT"}, "text": "is", "orig": "is", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 131, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 262.003, "r_y0": 676.886, "r_x1": 286.362, "r_y1": 676.886, "r_x2": 286.362, "r_y2": 668.3340000000001, "r_x3": 262.003, "r_y3": 668.3340000000001, "coord_origin": "TOPLEFT"}, "text": "the x-", "orig": "the x-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 132, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 688.841, "r_x1": 205.887, "r_y1": 688.841, "r_x2": 205.887, "r_y2": 680.289, "r_x3": 50.112, "r_y3": 680.289, "coord_origin": "TOPLEFT"}, "text": "coordinate for the corresponding point.", "orig": "coordinate for the corresponding point.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "where c is one of { left, centroid, right } and x c is the xcoordinate for the corresponding point."}, {"label": "list_item", "id": 13, "page_no": 11, "cluster": {"id": 13, "label": "list_item", "bbox": {"l": 50.112, "t": 692.559, "r": 286.365, "b": 713.066, "coord_origin": "TOPLEFT"}, "confidence": 0.9260510206222534, "cells": [{"index": 133, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 701.111, "r_x1": 69.539, "r_y1": 701.111, "r_x2": 69.539, "r_y2": 692.559, "r_x3": 62.067, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "5.", "orig": "5.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 134, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 76.274, "r_y0": 701.111, "r_x1": 286.365, "r_y1": 701.111, "r_x2": 286.365, "r_y2": 692.559, "r_x3": 76.274, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "Use the alignment computed in step 4, to compute", "orig": "Use the alignment computed in step 4, to compute", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 135, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 713.066, "r_x1": 94.605, "r_y1": 713.066, "r_x2": 94.605, "r_y2": 704.514, "r_x3": 50.112, "r_y3": 704.514, "coord_origin": "TOPLEFT"}, "text": "the median", "orig": "the median", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 136, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 97.599, "r_y0": 712.902, "r_x1": 103.293, "r_y1": 712.902, "r_x2": 103.293, "r_y2": 704.196, "r_x3": 97.599, "r_y3": 704.196, "coord_origin": "TOPLEFT"}, "text": "x", "orig": "x", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 137, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 103.292, "r_y0": 713.066, "r_x1": 286.365, "r_y1": 713.066, "r_x2": 286.365, "r_y2": 704.514, "r_x3": 103.292, "r_y3": 704.514, "coord_origin": "TOPLEFT"}, "text": "-coordinate for all table columns and the me-", "orig": "-coordinate for all table columns and the me-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "5. Use the alignment computed in step 4, to compute the median x -coordinate for all table columns and the me-"}, {"label": "text", "id": 16, "page_no": 11, "cluster": {"id": 16, "label": "text", "bbox": {"l": 308.862, "t": 211.20000000000005, "r": 545.115, "b": 255.61800000000005, "coord_origin": "TOPLEFT"}, "confidence": 0.8942298889160156, "cells": [{"index": 138, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 219.75199999999995, "r_x1": 435.915, "r_y1": 219.75199999999995, "r_x2": 435.915, "r_y2": 211.20000000000005, "r_x3": 308.862, "r_y3": 211.20000000000005, "coord_origin": "TOPLEFT"}, "text": "dian cell size for all table cells.", "orig": "dian cell size for all table cells.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 139, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 440.697, "r_y0": 219.75199999999995, "r_x1": 545.115, "r_y1": 219.75199999999995, "r_x2": 545.115, "r_y2": 211.20000000000005, "r_x3": 440.697, "r_y3": 211.20000000000005, "coord_origin": "TOPLEFT"}, "text": "The usage of median dur-", "orig": "The usage of median dur-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 140, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 231.70799999999997, "r_x1": 545.115, "r_y1": 231.70799999999997, "r_x2": 545.115, "r_y2": 223.15599999999995, "r_x3": 308.862, "r_y3": 223.15599999999995, "coord_origin": "TOPLEFT"}, "text": "ing the computations, helps to eliminate outliers caused by", "orig": "ing the computations, helps to eliminate outliers caused by", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 141, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 243.663, "r_x1": 545.115, "r_y1": 243.663, "r_x2": 545.115, "r_y2": 235.111, "r_x3": 308.862, "r_y3": 235.111, "coord_origin": "TOPLEFT"}, "text": "occasional column spans which are usually wider than the", "orig": "occasional column spans which are usually wider than the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 142, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 255.61800000000005, "r_x1": 339.577, "r_y1": 255.61800000000005, "r_x2": 339.577, "r_y2": 247.06600000000003, "r_x3": 308.862, "r_y3": 247.06600000000003, "coord_origin": "TOPLEFT"}, "text": "normal.", "orig": "normal.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "dian cell size for all table cells. The usage of median during the computations, helps to eliminate outliers caused by occasional column spans which are usually wider than the normal."}, {"label": "list_item", "id": 9, "page_no": 11, "cluster": {"id": 9, "label": "list_item", "bbox": {"l": 308.862, "t": 259.371, "r": 545.115, "b": 279.87800000000004, "coord_origin": "TOPLEFT"}, "confidence": 0.9423392415046692, "cells": [{"index": 143, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 267.923, "r_x1": 328.289, "r_y1": 267.923, "r_x2": 328.289, "r_y2": 259.371, "r_x3": 320.817, "r_y3": 259.371, "coord_origin": "TOPLEFT"}, "text": "6.", "orig": "6.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 144, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 334.884, "r_y0": 267.923, "r_x1": 545.115, "r_y1": 267.923, "r_x2": 545.115, "r_y2": 259.371, "r_x3": 334.884, "r_y3": 259.371, "coord_origin": "TOPLEFT"}, "text": "Snap all cells with bad IOU to their corresponding", "orig": "Snap all cells with bad IOU to their corresponding", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 145, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 279.87800000000004, "r_x1": 338.192, "r_y1": 279.87800000000004, "r_x2": 338.192, "r_y2": 271.326, "r_x3": 308.862, "r_y3": 271.326, "coord_origin": "TOPLEFT"}, "text": "median", "orig": "median", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 146, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 340.682, "r_y0": 279.71400000000006, "r_x1": 346.376, "r_y1": 279.71400000000006, "r_x2": 346.376, "r_y2": 271.00800000000004, "r_x3": 340.682, "r_y3": 271.00800000000004, "coord_origin": "TOPLEFT"}, "text": "x", "orig": "x", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 147, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 346.376, "r_y0": 279.87800000000004, "r_x1": 453.723, "r_y1": 279.87800000000004, "r_x2": 453.723, "r_y2": 271.326, "r_x3": 346.376, "r_y3": 271.326, "coord_origin": "TOPLEFT"}, "text": "-coordinates and cell sizes.", "orig": "-coordinates and cell sizes.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "6. Snap all cells with bad IOU to their corresponding median x -coordinates and cell sizes."}, {"label": "list_item", "id": 6, "page_no": 11, "cluster": {"id": 6, "label": "list_item", "bbox": {"l": 308.862, "t": 283.632, "r": 545.115, "b": 387.825, "coord_origin": "TOPLEFT"}, "confidence": 0.9562004804611206, "cells": [{"index": 148, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 292.184, "r_x1": 328.289, "r_y1": 292.184, "r_x2": 328.289, "r_y2": 283.632, "r_x3": 320.817, "r_y3": 283.632, "coord_origin": "TOPLEFT"}, "text": "7.", "orig": "7.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 149, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 332.144, "r_y0": 292.184, "r_x1": 545.115, "r_y1": 292.184, "r_x2": 545.115, "r_y2": 283.632, "r_x3": 332.144, "r_y3": 283.632, "coord_origin": "TOPLEFT"}, "text": "Generate a new set of pair-wise matches between the", "orig": "Generate a new set of pair-wise matches between the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 150, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 304.139, "r_x1": 476.562, "r_y1": 304.139, "r_x2": 476.562, "r_y2": 295.587, "r_x3": 308.862, "r_y3": 295.587, "coord_origin": "TOPLEFT"}, "text": "corrected bounding boxes and PDF cells.", "orig": "corrected bounding boxes and PDF cells.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 151, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 482.082, "r_y0": 304.139, "r_x1": 545.115, "r_y1": 304.139, "r_x2": 545.115, "r_y2": 295.587, "r_x3": 482.082, "r_y3": 295.587, "coord_origin": "TOPLEFT"}, "text": "This time use a", "orig": "This time use a", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 152, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 316.094, "r_x1": 545.115, "r_y1": 316.094, "r_x2": 545.115, "r_y2": 307.542, "r_x3": 308.862, "r_y3": 307.542, "coord_origin": "TOPLEFT"}, "text": "modified version of the IOU metric, where the area of the", "orig": "modified version of the IOU metric, where the area of the", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 153, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 328.049, "r_x1": 545.115, "r_y1": 328.049, "r_x2": 545.115, "r_y2": 319.497, "r_x3": 308.862, "r_y3": 319.497, "coord_origin": "TOPLEFT"}, "text": "intersection between the predicted and PDF cells is divided", "orig": "intersection between the predicted and PDF cells is divided", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 154, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 340.005, "r_x1": 397.19, "r_y1": 340.005, "r_x2": 397.19, "r_y2": 331.453, "r_x3": 308.862, "r_y3": 331.453, "coord_origin": "TOPLEFT"}, "text": "by the PDF cell area.", "orig": "by the PDF cell area.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 155, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 403.656, "r_y0": 340.005, "r_x1": 545.115, "r_y1": 340.005, "r_x2": 545.115, "r_y2": 331.453, "r_x3": 403.656, "r_y3": 331.453, "coord_origin": "TOPLEFT"}, "text": "In case there are multiple matches", "orig": "In case there are multiple matches", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 156, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 351.96, "r_x1": 545.115, "r_y1": 351.96, "r_x2": 545.115, "r_y2": 343.408, "r_x3": 308.862, "r_y3": 343.408, "coord_origin": "TOPLEFT"}, "text": "for the same PDF cell, the prediction with the higher score", "orig": "for the same PDF cell, the prediction with the higher score", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 157, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 363.915, "r_x1": 357.26, "r_y1": 363.915, "r_x2": 357.26, "r_y2": 355.363, "r_x3": 308.862, "r_y3": 355.363, "coord_origin": "TOPLEFT"}, "text": "is preferred.", "orig": "is preferred.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 158, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 361.176, "r_y0": 363.915, "r_x1": 545.115, "r_y1": 363.915, "r_x2": 545.115, "r_y2": 355.363, "r_x3": 361.176, "r_y3": 355.363, "coord_origin": "TOPLEFT"}, "text": "This covers the cases where the PDF cells are", "orig": "This covers the cases where the PDF cells are", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 159, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 375.87, "r_x1": 545.115, "r_y1": 375.87, "r_x2": 545.115, "r_y2": 367.318, "r_x3": 308.862, "r_y3": 367.318, "coord_origin": "TOPLEFT"}, "text": "smaller than the area of predicted or corrected prediction", "orig": "smaller than the area of predicted or corrected prediction", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 160, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 387.825, "r_x1": 329.614, "r_y1": 387.825, "r_x2": 329.614, "r_y2": 379.273, "r_x3": 308.862, "r_y3": 379.273, "coord_origin": "TOPLEFT"}, "text": "cells.", "orig": "cells.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "7. Generate a new set of pair-wise matches between the corrected bounding boxes and PDF cells. This time use a modified version of the IOU metric, where the area of the intersection between the predicted and PDF cells is divided by the PDF cell area. In case there are multiple matches for the same PDF cell, the prediction with the higher score is preferred. This covers the cases where the PDF cells are smaller than the area of predicted or corrected prediction cells."}, {"label": "list_item", "id": 17, "page_no": 11, "cluster": {"id": 17, "label": "list_item", "bbox": {"l": 308.862, "t": 391.579, "r": 545.115, "b": 459.906, "coord_origin": "TOPLEFT"}, "confidence": 0.8719939589500427, "cells": [{"index": 161, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 400.131, "r_x1": 328.289, "r_y1": 400.131, "r_x2": 328.289, "r_y2": 391.579, "r_x3": 320.817, "r_y3": 391.579, "coord_origin": "TOPLEFT"}, "text": "8.", "orig": "8.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 162, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 333.569, "r_y0": 400.131, "r_x1": 545.115, "r_y1": 400.131, "r_x2": 545.115, "r_y2": 391.579, "r_x3": 333.569, "r_y3": 391.579, "coord_origin": "TOPLEFT"}, "text": "In some rare occasions, we have noticed that Table-", "orig": "In some rare occasions, we have noticed that Table-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 163, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 412.086, "r_x1": 545.115, "r_y1": 412.086, "r_x2": 545.115, "r_y2": 403.534, "r_x3": 308.862, "r_y3": 403.534, "coord_origin": "TOPLEFT"}, "text": "Former can confuse a single column as two. When the post-", "orig": "Former can confuse a single column as two. When the post-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 164, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 424.041, "r_x1": 545.115, "r_y1": 424.041, "r_x2": 545.115, "r_y2": 415.489, "r_x3": 308.862, "r_y3": 415.489, "coord_origin": "TOPLEFT"}, "text": "processing steps are applied, this results with two predicted", "orig": "processing steps are applied, this results with two predicted", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 165, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 435.996, "r_x1": 488.109, "r_y1": 435.996, "r_x2": 488.109, "r_y2": 427.444, "r_x3": 308.862, "r_y3": 427.444, "coord_origin": "TOPLEFT"}, "text": "columns pointing to the same PDF column.", "orig": "columns pointing to the same PDF column.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 166, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 494.336, "r_y0": 435.996, "r_x1": 545.115, "r_y1": 435.996, "r_x2": 545.115, "r_y2": 427.444, "r_x3": 494.336, "r_y3": 427.444, "coord_origin": "TOPLEFT"}, "text": "In such case", "orig": "In such case", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 167, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 447.951, "r_x1": 545.115, "r_y1": 447.951, "r_x2": 545.115, "r_y2": 439.399, "r_x3": 308.862, "r_y3": 439.399, "coord_origin": "TOPLEFT"}, "text": "we must de-duplicate the columns according to highest to-", "orig": "we must de-duplicate the columns according to highest to-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 168, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 459.906, "r_x1": 426.182, "r_y1": 459.906, "r_x2": 426.182, "r_y2": 451.354, "r_x3": 308.862, "r_y3": 451.354, "coord_origin": "TOPLEFT"}, "text": "tal column intersection score.", "orig": "tal column intersection score.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "8. In some rare occasions, we have noticed that TableFormer can confuse a single column as two. When the postprocessing steps are applied, this results with two predicted columns pointing to the same PDF column. In such case we must de-duplicate the columns according to highest total column intersection score."}, {"label": "list_item", "id": 15, "page_no": 11, "cluster": {"id": 15, "label": "list_item", "bbox": {"l": 308.862, "t": 463.66, "r": 545.115, "b": 567.8530000000001, "coord_origin": "TOPLEFT"}, "confidence": 0.9126082062721252, "cells": [{"index": 169, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 472.212, "r_x1": 328.289, "r_y1": 472.212, "r_x2": 328.289, "r_y2": 463.66, "r_x3": 320.817, "r_y3": 463.66, "coord_origin": "TOPLEFT"}, "text": "9.", "orig": "9.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 170, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 333.629, "r_y0": 472.212, "r_x1": 478.505, "r_y1": 472.212, "r_x2": 478.505, "r_y2": 463.66, "r_x3": 333.629, "r_y3": 463.66, "coord_origin": "TOPLEFT"}, "text": "Pick up the remaining orphan cells.", "orig": "Pick up the remaining orphan cells.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 171, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 483.855, "r_y0": 472.212, "r_x1": 545.115, "r_y1": 472.212, "r_x2": 545.115, "r_y2": 463.66, "r_x3": 483.855, "r_y3": 463.66, "coord_origin": "TOPLEFT"}, "text": "There could be", "orig": "There could be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 172, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 484.167, "r_x1": 545.115, "r_y1": 484.167, "r_x2": 545.115, "r_y2": 475.615, "r_x3": 308.862, "r_y3": 475.615, "coord_origin": "TOPLEFT"}, "text": "cases, when after applying all the previous post-processing", "orig": "cases, when after applying all the previous post-processing", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 173, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 496.122, "r_x1": 545.115, "r_y1": 496.122, "r_x2": 545.115, "r_y2": 487.57, "r_x3": 308.862, "r_y3": 487.57, "coord_origin": "TOPLEFT"}, "text": "steps, some PDF cells could still remain without any match", "orig": "steps, some PDF cells could still remain without any match", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 174, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 508.077, "r_x1": 381.898, "r_y1": 508.077, "r_x2": 381.898, "r_y2": 499.525, "r_x3": 308.862, "r_y3": 499.525, "coord_origin": "TOPLEFT"}, "text": "to predicted cells.", "orig": "to predicted cells.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 175, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 388.702, "r_y0": 508.077, "r_x1": 545.115, "r_y1": 508.077, "r_x2": 545.115, "r_y2": 499.525, "r_x3": 388.702, "r_y3": 499.525, "coord_origin": "TOPLEFT"}, "text": "However, it is still possible to deduce", "orig": "However, it is still possible to deduce", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 176, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 520.033, "r_x1": 545.115, "r_y1": 520.033, "r_x2": 545.115, "r_y2": 511.481, "r_x3": 308.862, "r_y3": 511.481, "coord_origin": "TOPLEFT"}, "text": "the correct matching for an orphan PDF cell by mapping its", "orig": "the correct matching for an orphan PDF cell by mapping its", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 177, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 531.988, "r_x1": 483.576, "r_y1": 531.988, "r_x2": 483.576, "r_y2": 523.4359999999999, "r_x3": 308.862, "r_y3": 523.4359999999999, "coord_origin": "TOPLEFT"}, "text": "bounding box on the geometry of the grid.", "orig": "bounding box on the geometry of the grid.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 178, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 489.195, "r_y0": 531.988, "r_x1": 545.115, "r_y1": 531.988, "r_x2": 545.115, "r_y2": 523.4359999999999, "r_x3": 489.195, "r_y3": 523.4359999999999, "coord_origin": "TOPLEFT"}, "text": "This mapping", "orig": "This mapping", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 179, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 543.943, "r_x1": 545.115, "r_y1": 543.943, "r_x2": 545.115, "r_y2": 535.3910000000001, "r_x3": 308.862, "r_y3": 535.3910000000001, "coord_origin": "TOPLEFT"}, "text": "decides if the content of the orphan cell will be appended to", "orig": "decides if the content of the orphan cell will be appended to", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 180, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 555.898, "r_x1": 545.115, "r_y1": 555.898, "r_x2": 545.115, "r_y2": 547.346, "r_x3": 308.862, "r_y3": 547.346, "coord_origin": "TOPLEFT"}, "text": "an already matched table cell, or a new table cell should be", "orig": "an already matched table cell, or a new table cell should be", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 181, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 567.8530000000001, "r_x1": 442.221, "r_y1": 567.8530000000001, "r_x2": 442.221, "r_y2": 559.3009999999999, "r_x3": 308.862, "r_y3": 559.3009999999999, "coord_origin": "TOPLEFT"}, "text": "created to match with the orphan.", "orig": "created to match with the orphan.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "9. Pick up the remaining orphan cells. There could be cases, when after applying all the previous post-processing steps, some PDF cells could still remain without any match to predicted cells. However, it is still possible to deduce the correct matching for an orphan PDF cell by mapping its bounding box on the geometry of the grid. This mapping decides if the content of the orphan cell will be appended to an already matched table cell, or a new table cell should be created to match with the orphan."}, {"label": "text", "id": 19, "page_no": 11, "cluster": {"id": 19, "label": "text", "bbox": {"l": 308.862, "t": 571.607, "r": 545.117, "b": 604.069, "coord_origin": "TOPLEFT"}, "confidence": 0.8459473848342896, "cells": [{"index": 182, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 580.159, "r_x1": 332.712, "r_y1": 580.159, "r_x2": 332.712, "r_y2": 571.607, "r_x3": 320.817, "r_y3": 571.607, "coord_origin": "TOPLEFT"}, "text": "9a.", "orig": "9a.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 183, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 337.943, "r_y0": 580.159, "r_x1": 545.115, "r_y1": 580.159, "r_x2": 545.115, "r_y2": 571.607, "r_x3": 337.943, "r_y3": 571.607, "coord_origin": "TOPLEFT"}, "text": "Compute the top and bottom boundary of the hori-", "orig": "Compute the top and bottom boundary of the hori-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 184, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 592.114, "r_x1": 471.641, "r_y1": 592.114, "r_x2": 471.641, "r_y2": 583.562, "r_x3": 308.862, "r_y3": 583.562, "coord_origin": "TOPLEFT"}, "text": "zontal band for each grid row (min/max", "orig": "zontal band for each grid row (min/max", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 185, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 474.834, "r_y0": 591.95, "r_x1": 479.719, "r_y1": 591.95, "r_x2": 479.719, "r_y2": 583.244, "r_x3": 474.834, "r_y3": 583.244, "coord_origin": "TOPLEFT"}, "text": "y", "orig": "y", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 186, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 483.269, "r_y0": 592.114, "r_x1": 545.117, "r_y1": 592.114, "r_x2": 545.117, "r_y2": 583.562, "r_x3": 483.269, "r_y3": 583.562, "coord_origin": "TOPLEFT"}, "text": "coordinates per", "orig": "coordinates per", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 187, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 604.069, "r_x1": 329.913, "r_y1": 604.069, "r_x2": 329.913, "r_y2": 595.517, "r_x3": 308.862, "r_y3": 595.517, "coord_origin": "TOPLEFT"}, "text": "row).", "orig": "row).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "9a. Compute the top and bottom boundary of the horizontal band for each grid row (min/max y coordinates per row)."}, {"label": "list_item", "id": 21, "page_no": 11, "cluster": {"id": 21, "label": "list_item", "bbox": {"l": 308.862, "t": 607.822, "r": 545.115, "b": 628.33, "coord_origin": "TOPLEFT"}, "confidence": 0.7716891169548035, "cells": [{"index": 188, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 616.374, "r_x1": 332.872, "r_y1": 616.374, "r_x2": 332.872, "r_y2": 607.822, "r_x3": 320.817, "r_y3": 607.822, "coord_origin": "TOPLEFT"}, "text": "9b.", "orig": "9b.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 189, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 339.925, "r_y0": 616.374, "r_x1": 374.226, "r_y1": 616.374, "r_x2": 374.226, "r_y2": 607.822, "r_x3": 339.925, "r_y3": 607.822, "coord_origin": "TOPLEFT"}, "text": "Intersect", "orig": "Intersect", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 190, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 378.042, "r_y0": 616.374, "r_x1": 545.115, "r_y1": 616.374, "r_x2": 545.115, "r_y2": 607.822, "r_x3": 378.042, "r_y3": 607.822, "coord_origin": "TOPLEFT"}, "text": "the orphan's bounding box with the row", "orig": "the orphan's bounding box with the row", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 191, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 628.33, "r_x1": 495.292, "r_y1": 628.33, "r_x2": 495.292, "r_y2": 619.778, "r_x3": 308.862, "r_y3": 619.778, "coord_origin": "TOPLEFT"}, "text": "bands, and map the cell to the closest grid row.", "orig": "bands, and map the cell to the closest grid row.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "9b. Intersect the orphan's bounding box with the row bands, and map the cell to the closest grid row."}, {"label": "list_item", "id": 18, "page_no": 11, "cluster": {"id": 18, "label": "list_item", "bbox": {"l": 308.862, "t": 632.083, "r": 545.115, "b": 664.545, "coord_origin": "TOPLEFT"}, "confidence": 0.8584907054901123, "cells": [{"index": 192, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 640.635, "r_x1": 332.712, "r_y1": 640.635, "r_x2": 332.712, "r_y2": 632.083, "r_x3": 320.817, "r_y3": 632.083, "coord_origin": "TOPLEFT"}, "text": "9c.", "orig": "9c.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 193, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 337.534, "r_y0": 640.635, "r_x1": 545.115, "r_y1": 640.635, "r_x2": 545.115, "r_y2": 632.083, "r_x3": 337.534, "r_y3": 632.083, "coord_origin": "TOPLEFT"}, "text": "Compute the left and right boundary of the vertical", "orig": "Compute the left and right boundary of the vertical", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 194, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 652.59, "r_x1": 455.282, "r_y1": 652.59, "r_x2": 455.282, "r_y2": 644.038, "r_x3": 308.862, "r_y3": 644.038, "coord_origin": "TOPLEFT"}, "text": "band for each grid column (min/max", "orig": "band for each grid column (min/max", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 195, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 457.777, "r_y0": 652.4259999999999, "r_x1": 463.471, "r_y1": 652.4259999999999, "r_x2": 463.471, "r_y2": 643.72, "r_x3": 457.777, "r_y3": 643.72, "coord_origin": "TOPLEFT"}, "text": "x", "orig": "x", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 196, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 465.971, "r_y0": 652.59, "r_x1": 545.114, "r_y1": 652.59, "r_x2": 545.114, "r_y2": 644.038, "r_x3": 465.971, "r_y3": 644.038, "coord_origin": "TOPLEFT"}, "text": "coordinates per col-", "orig": "coordinates per col-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 197, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 664.545, "r_x1": 332.384, "r_y1": 664.545, "r_x2": 332.384, "r_y2": 655.9929999999999, "r_x3": 308.862, "r_y3": 655.9929999999999, "coord_origin": "TOPLEFT"}, "text": "umn).", "orig": "umn).", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "9c. Compute the left and right boundary of the vertical band for each grid column (min/max x coordinates per column)."}, {"label": "list_item", "id": 22, "page_no": 11, "cluster": {"id": 22, "label": "list_item", "bbox": {"l": 308.862, "t": 668.299, "r": 545.115, "b": 688.806, "coord_origin": "TOPLEFT"}, "confidence": 0.7590745091438293, "cells": [{"index": 198, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 676.851, "r_x1": 545.115, "r_y1": 676.851, "r_x2": 545.115, "r_y2": 668.299, "r_x3": 320.817, "r_y3": 668.299, "coord_origin": "TOPLEFT"}, "text": "9d. Intersect the orphan's bounding box with the column", "orig": "9d. Intersect the orphan's bounding box with the column", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 199, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 688.806, "r_x1": 510.585, "r_y1": 688.806, "r_x2": 510.585, "r_y2": 680.254, "r_x3": 308.862, "r_y3": 680.254, "coord_origin": "TOPLEFT"}, "text": "bands, and map the cell to the closest grid column.", "orig": "bands, and map the cell to the closest grid column.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "9d. Intersect the orphan's bounding box with the column bands, and map the cell to the closest grid column."}, {"label": "list_item", "id": 25, "page_no": 11, "cluster": {"id": 25, "label": "list_item", "bbox": {"l": 308.862, "t": 692.559, "r": 545.115, "b": 713.066, "coord_origin": "TOPLEFT"}, "confidence": 0.6971189975738525, "cells": [{"index": 200, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 320.817, "r_y0": 701.111, "r_x1": 545.115, "r_y1": 701.111, "r_x2": 545.115, "r_y2": 692.559, "r_x3": 320.817, "r_y3": 692.559, "coord_origin": "TOPLEFT"}, "text": "9e. If the table cell under the identified row and column", "orig": "9e. If the table cell under the identified row and column", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 201, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 713.066, "r_x1": 545.115, "r_y1": 713.066, "r_x2": 545.115, "r_y2": 704.514, "r_x3": 308.862, "r_y3": 704.514, "coord_origin": "TOPLEFT"}, "text": "is not empty, extend its content with the content of the or-", "orig": "is not empty, extend its content with the content of the or-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "9e. If the table cell under the identified row and column is not empty, extend its content with the content of the or-"}], "headers": [{"label": "page_footer", "id": 14, "page_no": 11, "cluster": {"id": 14, "label": "page_footer", "bbox": {"l": 292.631, "t": 734.402, "r": 302.594, "b": 742.954, "coord_origin": "TOPLEFT"}, "confidence": 0.9126598238945007, "cells": [{"index": 202, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 292.631, "r_y0": 742.954, "r_x1": 302.594, "r_y1": 742.954, "r_x2": 302.594, "r_y2": 734.402, "r_x3": 292.631, "r_y3": 734.402, "coord_origin": "TOPLEFT"}, "text": "12", "orig": "12", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "12"}]}}, {"page_no": 12, "size": {"width": 612.0, "height": 792.0}, "cells": [{"index": 0, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 84.029, "r_x1": 88.847, "r_y1": 84.029, "r_x2": 88.847, "r_y2": 75.47699999999998, "r_x3": 50.112, "r_y3": 75.47699999999998, "coord_origin": "TOPLEFT"}, "text": "phan cell.", "orig": "phan cell.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 95.98400000000004, "r_x1": 72.856, "r_y1": 95.98400000000004, "r_x2": 72.856, "r_y2": 87.43200000000002, "r_x3": 62.067, "r_y3": 87.43200000000002, "coord_origin": "TOPLEFT"}, "text": "9f.", "orig": "9f.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 78.316, "r_y0": 95.98400000000004, "r_x1": 286.365, "r_y1": 95.98400000000004, "r_x2": 286.365, "r_y2": 87.43200000000002, "r_x3": 78.316, "r_y3": 87.43200000000002, "coord_origin": "TOPLEFT"}, "text": "Otherwise create a new structural cell and match it", "orig": "Otherwise create a new structural cell and match it", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 107.93899999999996, "r_x1": 127.033, "r_y1": 107.93899999999996, "r_x2": 127.033, "r_y2": 99.38699999999994, "r_x3": 50.112, "r_y3": 99.38699999999994, "coord_origin": "TOPLEFT"}, "text": "wit the orphan cell.", "orig": "wit the orphan cell.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 119.75099999999998, "r_x1": 286.365, "r_y1": 119.75099999999998, "r_x2": 286.365, "r_y2": 111.16300000000001, "r_x3": 62.067, "r_y3": 111.16300000000001, "coord_origin": "TOPLEFT"}, "text": "Aditional images with examples of TableFormer predic-", "orig": "Aditional images with examples of TableFormer predic-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 131.70600000000002, "r_x1": 234.061, "r_y1": 131.70600000000002, "r_x2": 234.061, "r_y2": 123.11800000000005, "r_x3": 50.112, "r_y3": 123.11800000000005, "coord_origin": "TOPLEFT"}, "text": "tions and post-processing can be found below.", "orig": "tions and post-processing can be found below.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 63.341, "r_y0": 510.877, "r_x1": 99.595, "r_y1": 510.877, "r_x2": 99.595, "r_y2": 502.325, "r_x3": 63.341, "r_y3": 502.325, "coord_origin": "TOPLEFT"}, "text": "Figure 8:", "orig": "Figure 8:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 105.174, "r_y0": 510.877, "r_x1": 273.133, "r_y1": 510.877, "r_x2": 273.133, "r_y2": 502.325, "r_x3": 105.174, "r_y3": 502.325, "coord_origin": "TOPLEFT"}, "text": "Example of a table with multi-line header.", "orig": "Example of a table with multi-line header.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 315.419, "r_x1": 345.634, "r_y1": 315.419, "r_x2": 345.634, "r_y2": 306.867, "r_x3": 308.862, "r_y3": 306.867, "coord_origin": "TOPLEFT"}, "text": "Figure 9:", "orig": "Figure 9:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 352.787, "r_y0": 315.419, "r_x1": 545.115, "r_y1": 315.419, "r_x2": 545.115, "r_y2": 306.867, "r_x3": 352.787, "r_y3": 306.867, "coord_origin": "TOPLEFT"}, "text": "Example of a table with big empty distance be-", "orig": "Example of a table with big empty distance be-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 327.374, "r_x1": 355.895, "r_y1": 327.374, "r_x2": 355.895, "r_y2": 318.822, "r_x3": 308.862, "r_y3": 318.822, "coord_origin": "TOPLEFT"}, "text": "tween cells.", "orig": "tween cells.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 312.343, "r_y0": 689.314, "r_x1": 353.578, "r_y1": 689.314, "r_x2": 353.578, "r_y2": 680.762, "r_x3": 312.343, "r_y3": 680.762, "coord_origin": "TOPLEFT"}, "text": "Figure 10:", "orig": "Figure 10:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 359.157, "r_y0": 689.314, "r_x1": 541.632, "r_y1": 689.314, "r_x2": 541.632, "r_y2": 680.762, "r_x3": 359.157, "r_y3": 680.762, "coord_origin": "TOPLEFT"}, "text": "Example of a complex table with empty cells.", "orig": "Example of a complex table with empty cells.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 292.631, "r_y0": 742.954, "r_x1": 302.594, "r_y1": 742.954, "r_x2": 302.594, "r_y2": 734.402, "r_x3": 292.631, "r_y3": 734.402, "coord_origin": "TOPLEFT"}, "text": "13", "orig": "13", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "parsed_page": null, "predictions": {"layout": {"clusters": [{"id": 14, "label": "text", "bbox": {"l": 50.112, "t": 75.47699999999998, "r": 88.847, "b": 84.029, "coord_origin": "TOPLEFT"}, "confidence": 0.7545598149299622, "cells": [{"index": 0, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 84.029, "r_x1": 88.847, "r_y1": 84.029, "r_x2": 88.847, "r_y2": 75.47699999999998, "r_x3": 50.112, "r_y3": 75.47699999999998, "coord_origin": "TOPLEFT"}, "text": "phan cell.", "orig": "phan cell.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 3, "label": "text", "bbox": {"l": 50.112, "t": 87.43200000000002, "r": 286.365, "b": 107.93899999999996, "coord_origin": "TOPLEFT"}, "confidence": 0.9170762300491333, "cells": [{"index": 1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 95.98400000000004, "r_x1": 72.856, "r_y1": 95.98400000000004, "r_x2": 72.856, "r_y2": 87.43200000000002, "r_x3": 62.067, "r_y3": 87.43200000000002, "coord_origin": "TOPLEFT"}, "text": "9f.", "orig": "9f.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 78.316, "r_y0": 95.98400000000004, "r_x1": 286.365, "r_y1": 95.98400000000004, "r_x2": 286.365, "r_y2": 87.43200000000002, "r_x3": 78.316, "r_y3": 87.43200000000002, "coord_origin": "TOPLEFT"}, "text": "Otherwise create a new structural cell and match it", "orig": "Otherwise create a new structural cell and match it", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 107.93899999999996, "r_x1": 127.033, "r_y1": 107.93899999999996, "r_x2": 127.033, "r_y2": 99.38699999999994, "r_x3": 50.112, "r_y3": 99.38699999999994, "coord_origin": "TOPLEFT"}, "text": "wit the orphan cell.", "orig": "wit the orphan cell.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 1, "label": "text", "bbox": {"l": 50.112, "t": 111.16300000000001, "r": 286.365, "b": 131.70600000000002, "coord_origin": "TOPLEFT"}, "confidence": 0.9454683065414429, "cells": [{"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 119.75099999999998, "r_x1": 286.365, "r_y1": 119.75099999999998, "r_x2": 286.365, "r_y2": 111.16300000000001, "r_x3": 62.067, "r_y3": 111.16300000000001, "coord_origin": "TOPLEFT"}, "text": "Aditional images with examples of TableFormer predic-", "orig": "Aditional images with examples of TableFormer predic-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 131.70600000000002, "r_x1": 234.061, "r_y1": 131.70600000000002, "r_x2": 234.061, "r_y2": 123.11800000000005, "r_x3": 50.112, "r_y3": 123.11800000000005, "coord_origin": "TOPLEFT"}, "text": "tions and post-processing can be found below.", "orig": "tions and post-processing can be found below.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 8, "label": "caption", "bbox": {"l": 63.341, "t": 502.325, "r": 273.133, "b": 510.877, "coord_origin": "TOPLEFT"}, "confidence": 0.8971090316772461, "cells": [{"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 63.341, "r_y0": 510.877, "r_x1": 99.595, "r_y1": 510.877, "r_x2": 99.595, "r_y2": 502.325, "r_x3": 63.341, "r_y3": 502.325, "coord_origin": "TOPLEFT"}, "text": "Figure 8:", "orig": "Figure 8:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 105.174, "r_y0": 510.877, "r_x1": 273.133, "r_y1": 510.877, "r_x2": 273.133, "r_y2": 502.325, "r_x3": 105.174, "r_y3": 502.325, "coord_origin": "TOPLEFT"}, "text": "Example of a table with multi-line header.", "orig": "Example of a table with multi-line header.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 11, "label": "caption", "bbox": {"l": 308.862, "t": 306.867, "r": 545.115, "b": 327.374, "coord_origin": "TOPLEFT"}, "confidence": 0.8773345351219177, "cells": [{"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 315.419, "r_x1": 345.634, "r_y1": 315.419, "r_x2": 345.634, "r_y2": 306.867, "r_x3": 308.862, "r_y3": 306.867, "coord_origin": "TOPLEFT"}, "text": "Figure 9:", "orig": "Figure 9:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 352.787, "r_y0": 315.419, "r_x1": 545.115, "r_y1": 315.419, "r_x2": 545.115, "r_y2": 306.867, "r_x3": 352.787, "r_y3": 306.867, "coord_origin": "TOPLEFT"}, "text": "Example of a table with big empty distance be-", "orig": "Example of a table with big empty distance be-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 327.374, "r_x1": 355.895, "r_y1": 327.374, "r_x2": 355.895, "r_y2": 318.822, "r_x3": 308.862, "r_y3": 318.822, "coord_origin": "TOPLEFT"}, "text": "tween cells.", "orig": "tween cells.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 2, "label": "caption", "bbox": {"l": 312.343, "t": 680.762, "r": 541.632, "b": 689.314, "coord_origin": "TOPLEFT"}, "confidence": 0.9188510179519653, "cells": [{"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 312.343, "r_y0": 689.314, "r_x1": 353.578, "r_y1": 689.314, "r_x2": 353.578, "r_y2": 680.762, "r_x3": 312.343, "r_y3": 680.762, "coord_origin": "TOPLEFT"}, "text": "Figure 10:", "orig": "Figure 10:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 359.157, "r_y0": 689.314, "r_x1": 541.632, "r_y1": 689.314, "r_x2": 541.632, "r_y2": 680.762, "r_x3": 359.157, "r_y3": 680.762, "coord_origin": "TOPLEFT"}, "text": "Example of a complex table with empty cells.", "orig": "Example of a complex table with empty cells.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 7, "label": "page_footer", "bbox": {"l": 292.631, "t": 734.402, "r": 302.594, "b": 742.954, "coord_origin": "TOPLEFT"}, "confidence": 0.9020507335662842, "cells": [{"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 292.631, "r_y0": 742.954, "r_x1": 302.594, "r_y1": 742.954, "r_x2": 302.594, "r_y2": 734.402, "r_x3": 292.631, "r_y3": 734.402, "coord_origin": "TOPLEFT"}, "text": "13", "orig": "13", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 17, "label": "table", "bbox": {"l": 310.3294372558594, "t": 101.17767333984375, "r": 555.8338623046875, "b": 136.14752197265625, "coord_origin": "TOPLEFT"}, "confidence": 0.70481276512146, "cells": [], "children": []}, {"id": 32, "label": "table", "bbox": {"l": 309.9566345214844, "t": 154.61448669433594, "r": 555.7466430664062, "b": 184.7225341796875, "coord_origin": "TOPLEFT"}, "confidence": 0.564289927482605, "cells": [], "children": []}, {"id": 9, "label": "table", "bbox": {"l": 84.0283203125, "t": 156.3335418701172, "r": 239.1690673828125, "b": 214.39334106445312, "coord_origin": "TOPLEFT"}, "confidence": 0.8857279419898987, "cells": [], "children": []}, {"id": 21, "label": "table", "bbox": {"l": 309.9635314941406, "t": 195.70541381835938, "r": 555.7054443359375, "b": 233.55145263671875, "coord_origin": "TOPLEFT"}, "confidence": 0.6602518558502197, "cells": [], "children": []}, {"id": 4, "label": "table", "bbox": {"l": 82.92001342773438, "t": 233.7763214111328, "r": 239.1903533935547, "b": 291.283935546875, "coord_origin": "TOPLEFT"}, "confidence": 0.9155725836753845, "cells": [], "children": []}, {"id": 19, "label": "picture", "bbox": {"l": 309.79150390625, "t": 253.90536499023438, "r": 425.9603271484375, "b": 292.39398193359375, "coord_origin": "TOPLEFT"}, "confidence": 0.6956620812416077, "cells": [], "children": []}, {"id": 37, "label": "table", "bbox": {"l": 309.79150390625, "t": 253.90536499023438, "r": 425.9603271484375, "b": 292.39398193359375, "coord_origin": "TOPLEFT"}, "confidence": 0.52826988697052, "cells": [], "children": []}, {"id": 6, "label": "table", "bbox": {"l": 83.94786071777344, "t": 309.0477294921875, "r": 239.17135620117188, "b": 367.9095764160156, "coord_origin": "TOPLEFT"}, "confidence": 0.9085132479667664, "cells": [], "children": []}, {"id": 12, "label": "table", "bbox": {"l": 335.2694091796875, "t": 388.46746826171875, "r": 490.081787109375, "b": 437.02239990234375, "coord_origin": "TOPLEFT"}, "confidence": 0.8486077189445496, "cells": [], "children": []}, {"id": 0, "label": "table", "bbox": {"l": 83.31756591796875, "t": 396.0135498046875, "r": 248.873046875, "b": 487.2569885253906, "coord_origin": "TOPLEFT"}, "confidence": 0.9613965749740601, "cells": [], "children": []}, {"id": 10, "label": "table", "bbox": {"l": 334.9334716796875, "t": 453.9476318359375, "r": 490.0914306640625, "b": 502.7210998535156, "coord_origin": "TOPLEFT"}, "confidence": 0.8815538287162781, "cells": [], "children": []}, {"id": 5, "label": "table", "bbox": {"l": 335.2545471191406, "t": 519.07568359375, "r": 490.22369384765625, "b": 567.6879272460938, "coord_origin": "TOPLEFT"}, "confidence": 0.9096733927726746, "cells": [], "children": []}, {"id": 13, "label": "picture", "bbox": {"l": 333.9573669433594, "t": 593.1134033203125, "r": 518.4768676757812, "b": 665.4903564453125, "coord_origin": "TOPLEFT"}, "confidence": 0.8023569583892822, "cells": [], "children": []}, {"id": 30, "label": "table", "bbox": {"l": 333.9573669433594, "t": 593.1134033203125, "r": 518.4768676757812, "b": 665.4903564453125, "coord_origin": "TOPLEFT"}, "confidence": 0.5930293798446655, "cells": [], "children": []}]}, "tablestructure": {"table_map": {"17": {"label": "table", "id": 17, "page_no": 12, "cluster": {"id": 17, "label": "table", "bbox": {"l": 310.3294372558594, "t": 101.17767333984375, "r": 555.8338623046875, "b": 136.14752197265625, "coord_origin": "TOPLEFT"}, "confidence": 0.70481276512146, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "ched", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, "32": {"label": "table", "id": 32, "page_no": 12, "cluster": {"id": 32, "label": "table", "bbox": {"l": 309.9566345214844, "t": 154.61448669433594, "r": 555.7466430664062, "b": 184.7225341796875, "coord_origin": "TOPLEFT"}, "confidence": 0.564289927482605, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "ched", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, "9": {"label": "table", "id": 9, "page_no": 12, "cluster": {"id": 9, "label": "table", "bbox": {"l": 84.0283203125, "t": 156.3335418701172, "r": 239.1690673828125, "b": 214.39334106445312, "coord_origin": "TOPLEFT"}, "confidence": 0.8857279419898987, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, "21": {"label": "table", "id": 21, "page_no": 12, "cluster": {"id": 21, "label": "table", "bbox": {"l": 309.9635314941406, "t": 195.70541381835938, "r": 555.7054443359375, "b": 233.55145263671875, "coord_origin": "TOPLEFT"}, "confidence": 0.6602518558502197, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "ched", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, "4": {"label": "table", "id": 4, "page_no": 12, "cluster": {"id": 4, "label": "table", "bbox": {"l": 82.92001342773438, "t": 233.7763214111328, "r": 239.1903533935547, "b": 291.283935546875, "coord_origin": "TOPLEFT"}, "confidence": 0.9155725836753845, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, "37": {"label": "table", "id": 37, "page_no": 12, "cluster": {"id": 37, "label": "table", "bbox": {"l": 309.79150390625, "t": 253.90536499023438, "r": 425.9603271484375, "b": 292.39398193359375, "coord_origin": "TOPLEFT"}, "confidence": 0.52826988697052, "cells": [], "children": []}, "text": null, "otsl_seq": ["fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "lcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, "6": {"label": "table", "id": 6, "page_no": 12, "cluster": {"id": 6, "label": "table", "bbox": {"l": 83.94786071777344, "t": 309.0477294921875, "r": 239.17135620117188, "b": 367.9095764160156, "coord_origin": "TOPLEFT"}, "confidence": 0.9085132479667664, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, "12": {"label": "table", "id": 12, "page_no": 12, "cluster": {"id": 12, "label": "table", "bbox": {"l": 335.2694091796875, "t": 388.46746826171875, "r": 490.081787109375, "b": 437.02239990234375, "coord_origin": "TOPLEFT"}, "confidence": 0.8486077189445496, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "lcel", "lcel", "lcel", "lcel", "nl", "ched", "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, "0": {"label": "table", "id": 0, "page_no": 12, "cluster": {"id": 0, "label": "table", "bbox": {"l": 83.31756591796875, "t": 396.0135498046875, "r": 248.873046875, "b": 487.2569885253906, "coord_origin": "TOPLEFT"}, "confidence": 0.9613965749740601, "cells": [], "children": []}, "text": null, "otsl_seq": ["fcel", "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, "10": {"label": "table", "id": 10, "page_no": 12, "cluster": {"id": 10, "label": "table", "bbox": {"l": 334.9334716796875, "t": 453.9476318359375, "r": 490.0914306640625, "b": 502.7210998535156, "coord_origin": "TOPLEFT"}, "confidence": 0.8815538287162781, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "ched", "ched", "lcel", "ched", "nl", "ched", "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, "5": {"label": "table", "id": 5, "page_no": 12, "cluster": {"id": 5, "label": "table", "bbox": {"l": 335.2545471191406, "t": 519.07568359375, "r": 490.22369384765625, "b": 567.6879272460938, "coord_origin": "TOPLEFT"}, "confidence": 0.9096733927726746, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "lcel", "lcel", "lcel", "lcel", "nl", "ched", "ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, "30": {"label": "table", "id": 30, "page_no": 12, "cluster": {"id": 30, "label": "table", "bbox": {"l": 333.9573669433594, "t": 593.1134033203125, "r": 518.4768676757812, "b": 665.4903564453125, "coord_origin": "TOPLEFT"}, "confidence": 0.5930293798446655, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "nl", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}}}, "figures_classification": null, "equations_prediction": null, "vlm_response": null}, "assembled": {"elements": [{"label": "text", "id": 14, "page_no": 12, "cluster": {"id": 14, "label": "text", "bbox": {"l": 50.112, "t": 75.47699999999998, "r": 88.847, "b": 84.029, "coord_origin": "TOPLEFT"}, "confidence": 0.7545598149299622, "cells": [{"index": 0, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 84.029, "r_x1": 88.847, "r_y1": 84.029, "r_x2": 88.847, "r_y2": 75.47699999999998, "r_x3": 50.112, "r_y3": 75.47699999999998, "coord_origin": "TOPLEFT"}, "text": "phan cell.", "orig": "phan cell.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "phan cell."}, {"label": "text", "id": 3, "page_no": 12, "cluster": {"id": 3, "label": "text", "bbox": {"l": 50.112, "t": 87.43200000000002, "r": 286.365, "b": 107.93899999999996, "coord_origin": "TOPLEFT"}, "confidence": 0.9170762300491333, "cells": [{"index": 1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 95.98400000000004, "r_x1": 72.856, "r_y1": 95.98400000000004, "r_x2": 72.856, "r_y2": 87.43200000000002, "r_x3": 62.067, "r_y3": 87.43200000000002, "coord_origin": "TOPLEFT"}, "text": "9f.", "orig": "9f.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 78.316, "r_y0": 95.98400000000004, "r_x1": 286.365, "r_y1": 95.98400000000004, "r_x2": 286.365, "r_y2": 87.43200000000002, "r_x3": 78.316, "r_y3": 87.43200000000002, "coord_origin": "TOPLEFT"}, "text": "Otherwise create a new structural cell and match it", "orig": "Otherwise create a new structural cell and match it", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 107.93899999999996, "r_x1": 127.033, "r_y1": 107.93899999999996, "r_x2": 127.033, "r_y2": 99.38699999999994, "r_x3": 50.112, "r_y3": 99.38699999999994, "coord_origin": "TOPLEFT"}, "text": "wit the orphan cell.", "orig": "wit the orphan cell.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "9f. Otherwise create a new structural cell and match it wit the orphan cell."}, {"label": "text", "id": 1, "page_no": 12, "cluster": {"id": 1, "label": "text", "bbox": {"l": 50.112, "t": 111.16300000000001, "r": 286.365, "b": 131.70600000000002, "coord_origin": "TOPLEFT"}, "confidence": 0.9454683065414429, "cells": [{"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 119.75099999999998, "r_x1": 286.365, "r_y1": 119.75099999999998, "r_x2": 286.365, "r_y2": 111.16300000000001, "r_x3": 62.067, "r_y3": 111.16300000000001, "coord_origin": "TOPLEFT"}, "text": "Aditional images with examples of TableFormer predic-", "orig": "Aditional images with examples of TableFormer predic-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 131.70600000000002, "r_x1": 234.061, "r_y1": 131.70600000000002, "r_x2": 234.061, "r_y2": 123.11800000000005, "r_x3": 50.112, "r_y3": 123.11800000000005, "coord_origin": "TOPLEFT"}, "text": "tions and post-processing can be found below.", "orig": "tions and post-processing can be found below.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Aditional images with examples of TableFormer predictions and post-processing can be found below."}, {"label": "caption", "id": 8, "page_no": 12, "cluster": {"id": 8, "label": "caption", "bbox": {"l": 63.341, "t": 502.325, "r": 273.133, "b": 510.877, "coord_origin": "TOPLEFT"}, "confidence": 0.8971090316772461, "cells": [{"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 63.341, "r_y0": 510.877, "r_x1": 99.595, "r_y1": 510.877, "r_x2": 99.595, "r_y2": 502.325, "r_x3": 63.341, "r_y3": 502.325, "coord_origin": "TOPLEFT"}, "text": "Figure 8:", "orig": "Figure 8:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 105.174, "r_y0": 510.877, "r_x1": 273.133, "r_y1": 510.877, "r_x2": 273.133, "r_y2": 502.325, "r_x3": 105.174, "r_y3": 502.325, "coord_origin": "TOPLEFT"}, "text": "Example of a table with multi-line header.", "orig": "Example of a table with multi-line header.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Figure 8: Example of a table with multi-line header."}, {"label": "caption", "id": 11, "page_no": 12, "cluster": {"id": 11, "label": "caption", "bbox": {"l": 308.862, "t": 306.867, "r": 545.115, "b": 327.374, "coord_origin": "TOPLEFT"}, "confidence": 0.8773345351219177, "cells": [{"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 315.419, "r_x1": 345.634, "r_y1": 315.419, "r_x2": 345.634, "r_y2": 306.867, "r_x3": 308.862, "r_y3": 306.867, "coord_origin": "TOPLEFT"}, "text": "Figure 9:", "orig": "Figure 9:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 352.787, "r_y0": 315.419, "r_x1": 545.115, "r_y1": 315.419, "r_x2": 545.115, "r_y2": 306.867, "r_x3": 352.787, "r_y3": 306.867, "coord_origin": "TOPLEFT"}, "text": "Example of a table with big empty distance be-", "orig": "Example of a table with big empty distance be-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 327.374, "r_x1": 355.895, "r_y1": 327.374, "r_x2": 355.895, "r_y2": 318.822, "r_x3": 308.862, "r_y3": 318.822, "coord_origin": "TOPLEFT"}, "text": "tween cells.", "orig": "tween cells.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Figure 9: Example of a table with big empty distance between cells."}, {"label": "caption", "id": 2, "page_no": 12, "cluster": {"id": 2, "label": "caption", "bbox": {"l": 312.343, "t": 680.762, "r": 541.632, "b": 689.314, "coord_origin": "TOPLEFT"}, "confidence": 0.9188510179519653, "cells": [{"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 312.343, "r_y0": 689.314, "r_x1": 353.578, "r_y1": 689.314, "r_x2": 353.578, "r_y2": 680.762, "r_x3": 312.343, "r_y3": 680.762, "coord_origin": "TOPLEFT"}, "text": "Figure 10:", "orig": "Figure 10:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 359.157, "r_y0": 689.314, "r_x1": 541.632, "r_y1": 689.314, "r_x2": 541.632, "r_y2": 680.762, "r_x3": 359.157, "r_y3": 680.762, "coord_origin": "TOPLEFT"}, "text": "Example of a complex table with empty cells.", "orig": "Example of a complex table with empty cells.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Figure 10: Example of a complex table with empty cells."}, {"label": "page_footer", "id": 7, "page_no": 12, "cluster": {"id": 7, "label": "page_footer", "bbox": {"l": 292.631, "t": 734.402, "r": 302.594, "b": 742.954, "coord_origin": "TOPLEFT"}, "confidence": 0.9020507335662842, "cells": [{"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 292.631, "r_y0": 742.954, "r_x1": 302.594, "r_y1": 742.954, "r_x2": 302.594, "r_y2": 734.402, "r_x3": 292.631, "r_y3": 734.402, "coord_origin": "TOPLEFT"}, "text": "13", "orig": "13", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "13"}, {"label": "table", "id": 17, "page_no": 12, "cluster": {"id": 17, "label": "table", "bbox": {"l": 310.3294372558594, "t": 101.17767333984375, "r": 555.8338623046875, "b": 136.14752197265625, "coord_origin": "TOPLEFT"}, "confidence": 0.70481276512146, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "ched", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, {"label": "table", "id": 32, "page_no": 12, "cluster": {"id": 32, "label": "table", "bbox": {"l": 309.9566345214844, "t": 154.61448669433594, "r": 555.7466430664062, "b": 184.7225341796875, "coord_origin": "TOPLEFT"}, "confidence": 0.564289927482605, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "ched", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, {"label": "table", "id": 9, "page_no": 12, "cluster": {"id": 9, "label": "table", "bbox": {"l": 84.0283203125, "t": 156.3335418701172, "r": 239.1690673828125, "b": 214.39334106445312, "coord_origin": "TOPLEFT"}, "confidence": 0.8857279419898987, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, {"label": "table", "id": 21, "page_no": 12, "cluster": {"id": 21, "label": "table", "bbox": {"l": 309.9635314941406, "t": 195.70541381835938, "r": 555.7054443359375, "b": 233.55145263671875, "coord_origin": "TOPLEFT"}, "confidence": 0.6602518558502197, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "ched", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, {"label": "table", "id": 4, "page_no": 12, "cluster": {"id": 4, "label": "table", "bbox": {"l": 82.92001342773438, "t": 233.7763214111328, "r": 239.1903533935547, "b": 291.283935546875, "coord_origin": "TOPLEFT"}, "confidence": 0.9155725836753845, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, {"label": "picture", "id": 19, "page_no": 12, "cluster": {"id": 19, "label": "picture", "bbox": {"l": 309.79150390625, "t": 253.90536499023438, "r": 425.9603271484375, "b": 292.39398193359375, "coord_origin": "TOPLEFT"}, "confidence": 0.6956620812416077, "cells": [], "children": []}, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null}, {"label": "table", "id": 37, "page_no": 12, "cluster": {"id": 37, "label": "table", "bbox": {"l": 309.79150390625, "t": 253.90536499023438, "r": 425.9603271484375, "b": 292.39398193359375, "coord_origin": "TOPLEFT"}, "confidence": 0.52826988697052, "cells": [], "children": []}, "text": null, "otsl_seq": ["fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "lcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, {"label": "table", "id": 6, "page_no": 12, "cluster": {"id": 6, "label": "table", "bbox": {"l": 83.94786071777344, "t": 309.0477294921875, "r": 239.17135620117188, "b": 367.9095764160156, "coord_origin": "TOPLEFT"}, "confidence": 0.9085132479667664, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, {"label": "table", "id": 12, "page_no": 12, "cluster": {"id": 12, "label": "table", "bbox": {"l": 335.2694091796875, "t": 388.46746826171875, "r": 490.081787109375, "b": 437.02239990234375, "coord_origin": "TOPLEFT"}, "confidence": 0.8486077189445496, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "lcel", "lcel", "lcel", "lcel", "nl", "ched", "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, {"label": "table", "id": 0, "page_no": 12, "cluster": {"id": 0, "label": "table", "bbox": {"l": 83.31756591796875, "t": 396.0135498046875, "r": 248.873046875, "b": 487.2569885253906, "coord_origin": "TOPLEFT"}, "confidence": 0.9613965749740601, "cells": [], "children": []}, "text": null, "otsl_seq": ["fcel", "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, {"label": "table", "id": 10, "page_no": 12, "cluster": {"id": 10, "label": "table", "bbox": {"l": 334.9334716796875, "t": 453.9476318359375, "r": 490.0914306640625, "b": 502.7210998535156, "coord_origin": "TOPLEFT"}, "confidence": 0.8815538287162781, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "ched", "ched", "lcel", "ched", "nl", "ched", "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, {"label": "table", "id": 5, "page_no": 12, "cluster": {"id": 5, "label": "table", "bbox": {"l": 335.2545471191406, "t": 519.07568359375, "r": 490.22369384765625, "b": 567.6879272460938, "coord_origin": "TOPLEFT"}, "confidence": 0.9096733927726746, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "lcel", "lcel", "lcel", "lcel", "nl", "ched", "ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, {"label": "picture", "id": 13, "page_no": 12, "cluster": {"id": 13, "label": "picture", "bbox": {"l": 333.9573669433594, "t": 593.1134033203125, "r": 518.4768676757812, "b": 665.4903564453125, "coord_origin": "TOPLEFT"}, "confidence": 0.8023569583892822, "cells": [], "children": []}, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null}, {"label": "table", "id": 30, "page_no": 12, "cluster": {"id": 30, "label": "table", "bbox": {"l": 333.9573669433594, "t": 593.1134033203125, "r": 518.4768676757812, "b": 665.4903564453125, "coord_origin": "TOPLEFT"}, "confidence": 0.5930293798446655, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "nl", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}], "body": [{"label": "text", "id": 14, "page_no": 12, "cluster": {"id": 14, "label": "text", "bbox": {"l": 50.112, "t": 75.47699999999998, "r": 88.847, "b": 84.029, "coord_origin": "TOPLEFT"}, "confidence": 0.7545598149299622, "cells": [{"index": 0, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 84.029, "r_x1": 88.847, "r_y1": 84.029, "r_x2": 88.847, "r_y2": 75.47699999999998, "r_x3": 50.112, "r_y3": 75.47699999999998, "coord_origin": "TOPLEFT"}, "text": "phan cell.", "orig": "phan cell.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "phan cell."}, {"label": "text", "id": 3, "page_no": 12, "cluster": {"id": 3, "label": "text", "bbox": {"l": 50.112, "t": 87.43200000000002, "r": 286.365, "b": 107.93899999999996, "coord_origin": "TOPLEFT"}, "confidence": 0.9170762300491333, "cells": [{"index": 1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 95.98400000000004, "r_x1": 72.856, "r_y1": 95.98400000000004, "r_x2": 72.856, "r_y2": 87.43200000000002, "r_x3": 62.067, "r_y3": 87.43200000000002, "coord_origin": "TOPLEFT"}, "text": "9f.", "orig": "9f.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 78.316, "r_y0": 95.98400000000004, "r_x1": 286.365, "r_y1": 95.98400000000004, "r_x2": 286.365, "r_y2": 87.43200000000002, "r_x3": 78.316, "r_y3": 87.43200000000002, "coord_origin": "TOPLEFT"}, "text": "Otherwise create a new structural cell and match it", "orig": "Otherwise create a new structural cell and match it", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 107.93899999999996, "r_x1": 127.033, "r_y1": 107.93899999999996, "r_x2": 127.033, "r_y2": 99.38699999999994, "r_x3": 50.112, "r_y3": 99.38699999999994, "coord_origin": "TOPLEFT"}, "text": "wit the orphan cell.", "orig": "wit the orphan cell.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "9f. Otherwise create a new structural cell and match it wit the orphan cell."}, {"label": "text", "id": 1, "page_no": 12, "cluster": {"id": 1, "label": "text", "bbox": {"l": 50.112, "t": 111.16300000000001, "r": 286.365, "b": 131.70600000000002, "coord_origin": "TOPLEFT"}, "confidence": 0.9454683065414429, "cells": [{"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 62.067, "r_y0": 119.75099999999998, "r_x1": 286.365, "r_y1": 119.75099999999998, "r_x2": 286.365, "r_y2": 111.16300000000001, "r_x3": 62.067, "r_y3": 111.16300000000001, "coord_origin": "TOPLEFT"}, "text": "Aditional images with examples of TableFormer predic-", "orig": "Aditional images with examples of TableFormer predic-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 131.70600000000002, "r_x1": 234.061, "r_y1": 131.70600000000002, "r_x2": 234.061, "r_y2": 123.11800000000005, "r_x3": 50.112, "r_y3": 123.11800000000005, "coord_origin": "TOPLEFT"}, "text": "tions and post-processing can be found below.", "orig": "tions and post-processing can be found below.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Aditional images with examples of TableFormer predictions and post-processing can be found below."}, {"label": "caption", "id": 8, "page_no": 12, "cluster": {"id": 8, "label": "caption", "bbox": {"l": 63.341, "t": 502.325, "r": 273.133, "b": 510.877, "coord_origin": "TOPLEFT"}, "confidence": 0.8971090316772461, "cells": [{"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 63.341, "r_y0": 510.877, "r_x1": 99.595, "r_y1": 510.877, "r_x2": 99.595, "r_y2": 502.325, "r_x3": 63.341, "r_y3": 502.325, "coord_origin": "TOPLEFT"}, "text": "Figure 8:", "orig": "Figure 8:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 105.174, "r_y0": 510.877, "r_x1": 273.133, "r_y1": 510.877, "r_x2": 273.133, "r_y2": 502.325, "r_x3": 105.174, "r_y3": 502.325, "coord_origin": "TOPLEFT"}, "text": "Example of a table with multi-line header.", "orig": "Example of a table with multi-line header.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Figure 8: Example of a table with multi-line header."}, {"label": "caption", "id": 11, "page_no": 12, "cluster": {"id": 11, "label": "caption", "bbox": {"l": 308.862, "t": 306.867, "r": 545.115, "b": 327.374, "coord_origin": "TOPLEFT"}, "confidence": 0.8773345351219177, "cells": [{"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 315.419, "r_x1": 345.634, "r_y1": 315.419, "r_x2": 345.634, "r_y2": 306.867, "r_x3": 308.862, "r_y3": 306.867, "coord_origin": "TOPLEFT"}, "text": "Figure 9:", "orig": "Figure 9:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 352.787, "r_y0": 315.419, "r_x1": 545.115, "r_y1": 315.419, "r_x2": 545.115, "r_y2": 306.867, "r_x3": 352.787, "r_y3": 306.867, "coord_origin": "TOPLEFT"}, "text": "Example of a table with big empty distance be-", "orig": "Example of a table with big empty distance be-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 327.374, "r_x1": 355.895, "r_y1": 327.374, "r_x2": 355.895, "r_y2": 318.822, "r_x3": 308.862, "r_y3": 318.822, "coord_origin": "TOPLEFT"}, "text": "tween cells.", "orig": "tween cells.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Figure 9: Example of a table with big empty distance between cells."}, {"label": "caption", "id": 2, "page_no": 12, "cluster": {"id": 2, "label": "caption", "bbox": {"l": 312.343, "t": 680.762, "r": 541.632, "b": 689.314, "coord_origin": "TOPLEFT"}, "confidence": 0.9188510179519653, "cells": [{"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 312.343, "r_y0": 689.314, "r_x1": 353.578, "r_y1": 689.314, "r_x2": 353.578, "r_y2": 680.762, "r_x3": 312.343, "r_y3": 680.762, "coord_origin": "TOPLEFT"}, "text": "Figure 10:", "orig": "Figure 10:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 12, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 359.157, "r_y0": 689.314, "r_x1": 541.632, "r_y1": 689.314, "r_x2": 541.632, "r_y2": 680.762, "r_x3": 359.157, "r_y3": 680.762, "coord_origin": "TOPLEFT"}, "text": "Example of a complex table with empty cells.", "orig": "Example of a complex table with empty cells.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Figure 10: Example of a complex table with empty cells."}, {"label": "table", "id": 17, "page_no": 12, "cluster": {"id": 17, "label": "table", "bbox": {"l": 310.3294372558594, "t": 101.17767333984375, "r": 555.8338623046875, "b": 136.14752197265625, "coord_origin": "TOPLEFT"}, "confidence": 0.70481276512146, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "ched", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, {"label": "table", "id": 32, "page_no": 12, "cluster": {"id": 32, "label": "table", "bbox": {"l": 309.9566345214844, "t": 154.61448669433594, "r": 555.7466430664062, "b": 184.7225341796875, "coord_origin": "TOPLEFT"}, "confidence": 0.564289927482605, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "ched", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, {"label": "table", "id": 9, "page_no": 12, "cluster": {"id": 9, "label": "table", "bbox": {"l": 84.0283203125, "t": 156.3335418701172, "r": 239.1690673828125, "b": 214.39334106445312, "coord_origin": "TOPLEFT"}, "confidence": 0.8857279419898987, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, {"label": "table", "id": 21, "page_no": 12, "cluster": {"id": 21, "label": "table", "bbox": {"l": 309.9635314941406, "t": 195.70541381835938, "r": 555.7054443359375, "b": 233.55145263671875, "coord_origin": "TOPLEFT"}, "confidence": 0.6602518558502197, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "ched", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, {"label": "table", "id": 4, "page_no": 12, "cluster": {"id": 4, "label": "table", "bbox": {"l": 82.92001342773438, "t": 233.7763214111328, "r": 239.1903533935547, "b": 291.283935546875, "coord_origin": "TOPLEFT"}, "confidence": 0.9155725836753845, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, {"label": "picture", "id": 19, "page_no": 12, "cluster": {"id": 19, "label": "picture", "bbox": {"l": 309.79150390625, "t": 253.90536499023438, "r": 425.9603271484375, "b": 292.39398193359375, "coord_origin": "TOPLEFT"}, "confidence": 0.6956620812416077, "cells": [], "children": []}, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null}, {"label": "table", "id": 37, "page_no": 12, "cluster": {"id": 37, "label": "table", "bbox": {"l": 309.79150390625, "t": 253.90536499023438, "r": 425.9603271484375, "b": 292.39398193359375, "coord_origin": "TOPLEFT"}, "confidence": 0.52826988697052, "cells": [], "children": []}, "text": null, "otsl_seq": ["fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "lcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, {"label": "table", "id": 6, "page_no": 12, "cluster": {"id": 6, "label": "table", "bbox": {"l": 83.94786071777344, "t": 309.0477294921875, "r": 239.17135620117188, "b": 367.9095764160156, "coord_origin": "TOPLEFT"}, "confidence": 0.9085132479667664, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, {"label": "table", "id": 12, "page_no": 12, "cluster": {"id": 12, "label": "table", "bbox": {"l": 335.2694091796875, "t": 388.46746826171875, "r": 490.081787109375, "b": 437.02239990234375, "coord_origin": "TOPLEFT"}, "confidence": 0.8486077189445496, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "lcel", "lcel", "lcel", "lcel", "nl", "ched", "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, {"label": "table", "id": 0, "page_no": 12, "cluster": {"id": 0, "label": "table", "bbox": {"l": 83.31756591796875, "t": 396.0135498046875, "r": 248.873046875, "b": 487.2569885253906, "coord_origin": "TOPLEFT"}, "confidence": 0.9613965749740601, "cells": [], "children": []}, "text": null, "otsl_seq": ["fcel", "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, {"label": "table", "id": 10, "page_no": 12, "cluster": {"id": 10, "label": "table", "bbox": {"l": 334.9334716796875, "t": 453.9476318359375, "r": 490.0914306640625, "b": 502.7210998535156, "coord_origin": "TOPLEFT"}, "confidence": 0.8815538287162781, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "ched", "ched", "lcel", "ched", "nl", "ched", "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, {"label": "table", "id": 5, "page_no": 12, "cluster": {"id": 5, "label": "table", "bbox": {"l": 335.2545471191406, "t": 519.07568359375, "r": 490.22369384765625, "b": 567.6879272460938, "coord_origin": "TOPLEFT"}, "confidence": 0.9096733927726746, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "lcel", "lcel", "lcel", "lcel", "nl", "ched", "ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, {"label": "picture", "id": 13, "page_no": 12, "cluster": {"id": 13, "label": "picture", "bbox": {"l": 333.9573669433594, "t": 593.1134033203125, "r": 518.4768676757812, "b": 665.4903564453125, "coord_origin": "TOPLEFT"}, "confidence": 0.8023569583892822, "cells": [], "children": []}, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null}, {"label": "table", "id": 30, "page_no": 12, "cluster": {"id": 30, "label": "table", "bbox": {"l": 333.9573669433594, "t": 593.1134033203125, "r": 518.4768676757812, "b": 665.4903564453125, "coord_origin": "TOPLEFT"}, "confidence": 0.5930293798446655, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "nl", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}], "headers": [{"label": "page_footer", "id": 7, "page_no": 12, "cluster": {"id": 7, "label": "page_footer", "bbox": {"l": 292.631, "t": 734.402, "r": 302.594, "b": 742.954, "coord_origin": "TOPLEFT"}, "confidence": 0.9020507335662842, "cells": [{"index": 13, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 292.631, "r_y0": 742.954, "r_x1": 302.594, "r_y1": 742.954, "r_x2": 302.594, "r_y2": 734.402, "r_x3": 292.631, "r_y3": 734.402, "coord_origin": "TOPLEFT"}, "text": "13", "orig": "13", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "13"}]}}, {"page_no": 13, "size": {"width": 612.0, "height": 792.0}, "cells": [{"index": 0, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 365.591, "r_x1": 93.051, "r_y1": 365.591, "r_x2": 93.051, "r_y2": 357.039, "r_x3": 50.112, "r_y3": 357.039, "coord_origin": "TOPLEFT"}, "text": "Figure 11:", "orig": "Figure 11:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 103.731, "r_y0": 365.591, "r_x1": 215.67, "r_y1": 365.591, "r_x2": 215.67, "r_y2": 357.039, "r_x3": 103.731, "r_y3": 357.039, "coord_origin": "TOPLEFT"}, "text": "Simple table with different", "orig": "Simple table with different", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 219.865, "r_y0": 365.591, "r_x1": 238.684, "r_y1": 365.591, "r_x2": 238.684, "r_y2": 357.039, "r_x3": 219.865, "r_y3": 357.039, "coord_origin": "TOPLEFT"}, "text": "style", "orig": "style", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 242.878, "r_y0": 365.591, "r_x1": 286.365, "r_y1": 365.591, "r_x2": 286.365, "r_y2": 357.039, "r_x3": 242.878, "r_y3": 357.039, "coord_origin": "TOPLEFT"}, "text": "and empty", "orig": "and empty", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 377.546, "r_x1": 70.864, "r_y1": 377.546, "r_x2": 70.864, "r_y2": 368.994, "r_x3": 50.112, "r_y3": 368.994, "coord_origin": "TOPLEFT"}, "text": "cells.", "orig": "cells.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 54.619, "r_y0": 680.639, "r_x1": 95.854, "r_y1": 680.639, "r_x2": 95.854, "r_y2": 672.087, "r_x3": 54.619, "r_y3": 672.087, "coord_origin": "TOPLEFT"}, "text": "Figure 12:", "orig": "Figure 12:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 101.433, "r_y0": 680.639, "r_x1": 281.856, "r_y1": 680.639, "r_x2": 281.856, "r_y2": 672.087, "r_x3": 101.433, "r_y3": 672.087, "coord_origin": "TOPLEFT"}, "text": "Simple table predictions and post processing.", "orig": "Simple table predictions and post processing.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 315.79, "r_y0": 380.505, "r_x1": 357.025, "r_y1": 380.505, "r_x2": 357.025, "r_y2": 371.953, "r_x3": 315.79, "r_y3": 371.953, "coord_origin": "TOPLEFT"}, "text": "Figure 13:", "orig": "Figure 13:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 362.604, "r_y0": 380.505, "r_x1": 538.185, "r_y1": 380.505, "r_x2": 538.185, "r_y2": 371.953, "r_x3": 362.604, "r_y3": 371.953, "coord_origin": "TOPLEFT"}, "text": "Table predictions example on colorful table.", "orig": "Table predictions example on colorful table.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 344.985, "r_y0": 692.367, "r_x1": 386.22, "r_y1": 692.367, "r_x2": 386.22, "r_y2": 683.815, "r_x3": 344.985, "r_y3": 683.815, "coord_origin": "TOPLEFT"}, "text": "Figure 14:", "orig": "Figure 14:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 391.799, "r_y0": 692.367, "r_x1": 508.989, "r_y1": 692.367, "r_x2": 508.989, "r_y2": 683.815, "r_x3": 391.799, "r_y3": 683.815, "coord_origin": "TOPLEFT"}, "text": "Example with multi-line text.", "orig": "Example with multi-line text.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 292.631, "r_y0": 742.954, "r_x1": 302.594, "r_y1": 742.954, "r_x2": 302.594, "r_y2": 734.402, "r_x3": 292.631, "r_y3": 734.402, "coord_origin": "TOPLEFT"}, "text": "14", "orig": "14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "parsed_page": null, "predictions": {"layout": {"clusters": [{"id": 0, "label": "caption", "bbox": {"l": 50.112, "t": 357.039, "r": 286.365, "b": 377.546, "coord_origin": "TOPLEFT"}, "confidence": 0.951069176197052, "cells": [{"index": 0, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 365.591, "r_x1": 93.051, "r_y1": 365.591, "r_x2": 93.051, "r_y2": 357.039, "r_x3": 50.112, "r_y3": 357.039, "coord_origin": "TOPLEFT"}, "text": "Figure 11:", "orig": "Figure 11:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 103.731, "r_y0": 365.591, "r_x1": 215.67, "r_y1": 365.591, "r_x2": 215.67, "r_y2": 357.039, "r_x3": 103.731, "r_y3": 357.039, "coord_origin": "TOPLEFT"}, "text": "Simple table with different", "orig": "Simple table with different", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 219.865, "r_y0": 365.591, "r_x1": 238.684, "r_y1": 365.591, "r_x2": 238.684, "r_y2": 357.039, "r_x3": 219.865, "r_y3": 357.039, "coord_origin": "TOPLEFT"}, "text": "style", "orig": "style", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 242.878, "r_y0": 365.591, "r_x1": 286.365, "r_y1": 365.591, "r_x2": 286.365, "r_y2": 357.039, "r_x3": 242.878, "r_y3": 357.039, "coord_origin": "TOPLEFT"}, "text": "and empty", "orig": "and empty", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 377.546, "r_x1": 70.864, "r_y1": 377.546, "r_x2": 70.864, "r_y2": 368.994, "r_x3": 50.112, "r_y3": 368.994, "coord_origin": "TOPLEFT"}, "text": "cells.", "orig": "cells.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 1, "label": "caption", "bbox": {"l": 54.619, "t": 672.087, "r": 281.856, "b": 680.639, "coord_origin": "TOPLEFT"}, "confidence": 0.926384687423706, "cells": [{"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 54.619, "r_y0": 680.639, "r_x1": 95.854, "r_y1": 680.639, "r_x2": 95.854, "r_y2": 672.087, "r_x3": 54.619, "r_y3": 672.087, "coord_origin": "TOPLEFT"}, "text": "Figure 12:", "orig": "Figure 12:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 101.433, "r_y0": 680.639, "r_x1": 281.856, "r_y1": 680.639, "r_x2": 281.856, "r_y2": 672.087, "r_x3": 101.433, "r_y3": 672.087, "coord_origin": "TOPLEFT"}, "text": "Simple table predictions and post processing.", "orig": "Simple table predictions and post processing.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 3, "label": "caption", "bbox": {"l": 315.79, "t": 371.953, "r": 538.185, "b": 380.505, "coord_origin": "TOPLEFT"}, "confidence": 0.9178510904312134, "cells": [{"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 315.79, "r_y0": 380.505, "r_x1": 357.025, "r_y1": 380.505, "r_x2": 357.025, "r_y2": 371.953, "r_x3": 315.79, "r_y3": 371.953, "coord_origin": "TOPLEFT"}, "text": "Figure 13:", "orig": "Figure 13:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 362.604, "r_y0": 380.505, "r_x1": 538.185, "r_y1": 380.505, "r_x2": 538.185, "r_y2": 371.953, "r_x3": 362.604, "r_y3": 371.953, "coord_origin": "TOPLEFT"}, "text": "Table predictions example on colorful table.", "orig": "Table predictions example on colorful table.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 2, "label": "caption", "bbox": {"l": 344.985, "t": 683.815, "r": 508.989, "b": 692.367, "coord_origin": "TOPLEFT"}, "confidence": 0.9191023111343384, "cells": [{"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 344.985, "r_y0": 692.367, "r_x1": 386.22, "r_y1": 692.367, "r_x2": 386.22, "r_y2": 683.815, "r_x3": 344.985, "r_y3": 683.815, "coord_origin": "TOPLEFT"}, "text": "Figure 14:", "orig": "Figure 14:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 391.799, "r_y0": 692.367, "r_x1": 508.989, "r_y1": 692.367, "r_x2": 508.989, "r_y2": 683.815, "r_x3": 391.799, "r_y3": 683.815, "coord_origin": "TOPLEFT"}, "text": "Example with multi-line text.", "orig": "Example with multi-line text.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 5, "label": "page_footer", "bbox": {"l": 292.631, "t": 734.402, "r": 302.594, "b": 742.954, "coord_origin": "TOPLEFT"}, "confidence": 0.887715220451355, "cells": [{"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 292.631, "r_y0": 742.954, "r_x1": 302.594, "r_y1": 742.954, "r_x2": 302.594, "r_y2": 734.402, "r_x3": 292.631, "r_y3": 734.402, "coord_origin": "TOPLEFT"}, "text": "14", "orig": "14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 41, "label": "picture", "bbox": {"l": 318.6332092285156, "t": 90.88423156738281, "r": 534.73583984375, "b": 359.0575866699219, "coord_origin": "TOPLEFT"}, "confidence": 0.5003598928451538, "cells": [], "children": []}, {"id": 30, "label": "picture", "bbox": {"l": 51.15378952026367, "t": 104.30851745605469, "r": 282.8598937988281, "b": 344.90667724609375, "coord_origin": "TOPLEFT"}, "confidence": 0.5613773465156555, "cells": [], "children": []}, {"id": 23, "label": "table", "bbox": {"l": 318.9809265136719, "t": 161.23460388183594, "r": 534.6229248046875, "b": 214.6260528564453, "coord_origin": "TOPLEFT"}, "confidence": 0.6235634684562683, "cells": [], "children": []}, {"id": 33, "label": "table", "bbox": {"l": 319.0057678222656, "t": 226.10633850097656, "r": 534.408935546875, "b": 279.8576965332031, "coord_origin": "TOPLEFT"}, "confidence": 0.5502500534057617, "cells": [], "children": []}, {"id": 27, "label": "table", "bbox": {"l": 51.72642135620117, "t": 273.6092834472656, "r": 283.114013671875, "b": 344.2445068359375, "coord_origin": "TOPLEFT"}, "confidence": 0.5696635246276855, "cells": [], "children": []}, {"id": 38, "label": "table", "bbox": {"l": 328.1381530761719, "t": 288.6817932128906, "r": 523.8916015625, "b": 358.2724304199219, "coord_origin": "TOPLEFT"}, "confidence": 0.5227423310279846, "cells": [], "children": []}, {"id": 10, "label": "table", "bbox": {"l": 319.4707946777344, "t": 430.90301513671875, "r": 518.5693359375, "b": 477.94354248046875, "coord_origin": "TOPLEFT"}, "confidence": 0.8384715914726257, "cells": [], "children": []}, {"id": 9, "label": "table", "bbox": {"l": 51.434879302978516, "t": 453.48748779296875, "r": 310.7267150878906, "b": 491.82025146484375, "coord_origin": "TOPLEFT"}, "confidence": 0.8418155908584595, "cells": [], "children": []}, {"id": 8, "label": "table", "bbox": {"l": 319.982666015625, "t": 489.2437438964844, "r": 519.0963745117188, "b": 535.69580078125, "coord_origin": "TOPLEFT"}, "confidence": 0.8502867221832275, "cells": [], "children": []}, {"id": 4, "label": "table", "bbox": {"l": 50.86823654174805, "t": 504.09625244140625, "r": 310.6080017089844, "b": 542.4459838867188, "coord_origin": "TOPLEFT"}, "confidence": 0.8922696709632874, "cells": [], "children": []}, {"id": 15, "label": "table", "bbox": {"l": 319.8287658691406, "t": 546.4093017578125, "r": 519.6065673828125, "b": 593.1064453125, "coord_origin": "TOPLEFT"}, "confidence": 0.6817973256111145, "cells": [], "children": []}, {"id": 6, "label": "table", "bbox": {"l": 51.27280807495117, "t": 553.728515625, "r": 311.0897216796875, "b": 591.913330078125, "coord_origin": "TOPLEFT"}, "confidence": 0.88722163438797, "cells": [], "children": []}, {"id": 7, "label": "table", "bbox": {"l": 319.06494140625, "t": 609.8408203125, "r": 533.77392578125, "b": 669.1920776367188, "coord_origin": "TOPLEFT"}, "confidence": 0.8717735409736633, "cells": [], "children": []}, {"id": 11, "label": "picture", "bbox": {"l": 50.40477752685547, "t": 611.0038452148438, "r": 177.0564422607422, "b": 656.1609497070312, "coord_origin": "TOPLEFT"}, "confidence": 0.7871124744415283, "cells": [], "children": []}]}, "tablestructure": {"table_map": {"23": {"label": "table", "id": 23, "page_no": 13, "cluster": {"id": 23, "label": "table", "bbox": {"l": 318.9809265136719, "t": 161.23460388183594, "r": 534.6229248046875, "b": 214.6260528564453, "coord_origin": "TOPLEFT"}, "confidence": 0.6235634684562683, "cells": [], "children": []}, "text": null, "otsl_seq": ["fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, "33": {"label": "table", "id": 33, "page_no": 13, "cluster": {"id": 33, "label": "table", "bbox": {"l": 319.0057678222656, "t": 226.10633850097656, "r": 534.408935546875, "b": 279.8576965332031, "coord_origin": "TOPLEFT"}, "confidence": 0.5502500534057617, "cells": [], "children": []}, "text": null, "otsl_seq": ["fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, "27": {"label": "table", "id": 27, "page_no": 13, "cluster": {"id": 27, "label": "table", "bbox": {"l": 51.72642135620117, "t": 273.6092834472656, "r": 283.114013671875, "b": 344.2445068359375, "coord_origin": "TOPLEFT"}, "confidence": 0.5696635246276855, "cells": [], "children": []}, "text": null, "otsl_seq": ["ecel", "ched", "ched", "ched", "ched", "ched", "nl", "ecel", "ched", "ched", "ched", "ched", "ched", "nl", "ecel", "ched", "ched", "ched", "ched", "ched", "nl", "fcel", "ched", "ched", "ched", "ched", "ched", "nl", "fcel", "ched", "ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "ecel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, "38": {"label": "table", "id": 38, "page_no": 13, "cluster": {"id": 38, "label": "table", "bbox": {"l": 328.1381530761719, "t": 288.6817932128906, "r": 523.8916015625, "b": 358.2724304199219, "coord_origin": "TOPLEFT"}, "confidence": 0.5227423310279846, "cells": [], "children": []}, "text": null, "otsl_seq": ["fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, "10": {"label": "table", "id": 10, "page_no": 13, "cluster": {"id": 10, "label": "table", "bbox": {"l": 319.4707946777344, "t": 430.90301513671875, "r": 518.5693359375, "b": 477.94354248046875, "coord_origin": "TOPLEFT"}, "confidence": 0.8384715914726257, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, "9": {"label": "table", "id": 9, "page_no": 13, "cluster": {"id": 9, "label": "table", "bbox": {"l": 51.434879302978516, "t": 453.48748779296875, "r": 310.7267150878906, "b": 491.82025146484375, "coord_origin": "TOPLEFT"}, "confidence": 0.8418155908584595, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, "8": {"label": "table", "id": 8, "page_no": 13, "cluster": {"id": 8, "label": "table", "bbox": {"l": 319.982666015625, "t": 489.2437438964844, "r": 519.0963745117188, "b": 535.69580078125, "coord_origin": "TOPLEFT"}, "confidence": 0.8502867221832275, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, "4": {"label": "table", "id": 4, "page_no": 13, "cluster": {"id": 4, "label": "table", "bbox": {"l": 50.86823654174805, "t": 504.09625244140625, "r": 310.6080017089844, "b": 542.4459838867188, "coord_origin": "TOPLEFT"}, "confidence": 0.8922696709632874, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, "15": {"label": "table", "id": 15, "page_no": 13, "cluster": {"id": 15, "label": "table", "bbox": {"l": 319.8287658691406, "t": 546.4093017578125, "r": 519.6065673828125, "b": 593.1064453125, "coord_origin": "TOPLEFT"}, "confidence": 0.6817973256111145, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, "6": {"label": "table", "id": 6, "page_no": 13, "cluster": {"id": 6, "label": "table", "bbox": {"l": 51.27280807495117, "t": 553.728515625, "r": 311.0897216796875, "b": 591.913330078125, "coord_origin": "TOPLEFT"}, "confidence": 0.88722163438797, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, "7": {"label": "table", "id": 7, "page_no": 13, "cluster": {"id": 7, "label": "table", "bbox": {"l": 319.06494140625, "t": 609.8408203125, "r": 533.77392578125, "b": 669.1920776367188, "coord_origin": "TOPLEFT"}, "confidence": 0.8717735409736633, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "ched", "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}}}, "figures_classification": null, "equations_prediction": null, "vlm_response": null}, "assembled": {"elements": [{"label": "caption", "id": 0, "page_no": 13, "cluster": {"id": 0, "label": "caption", "bbox": {"l": 50.112, "t": 357.039, "r": 286.365, "b": 377.546, "coord_origin": "TOPLEFT"}, "confidence": 0.951069176197052, "cells": [{"index": 0, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 365.591, "r_x1": 93.051, "r_y1": 365.591, "r_x2": 93.051, "r_y2": 357.039, "r_x3": 50.112, "r_y3": 357.039, "coord_origin": "TOPLEFT"}, "text": "Figure 11:", "orig": "Figure 11:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 103.731, "r_y0": 365.591, "r_x1": 215.67, "r_y1": 365.591, "r_x2": 215.67, "r_y2": 357.039, "r_x3": 103.731, "r_y3": 357.039, "coord_origin": "TOPLEFT"}, "text": "Simple table with different", "orig": "Simple table with different", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 219.865, "r_y0": 365.591, "r_x1": 238.684, "r_y1": 365.591, "r_x2": 238.684, "r_y2": 357.039, "r_x3": 219.865, "r_y3": 357.039, "coord_origin": "TOPLEFT"}, "text": "style", "orig": "style", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 242.878, "r_y0": 365.591, "r_x1": 286.365, "r_y1": 365.591, "r_x2": 286.365, "r_y2": 357.039, "r_x3": 242.878, "r_y3": 357.039, "coord_origin": "TOPLEFT"}, "text": "and empty", "orig": "and empty", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 377.546, "r_x1": 70.864, "r_y1": 377.546, "r_x2": 70.864, "r_y2": 368.994, "r_x3": 50.112, "r_y3": 368.994, "coord_origin": "TOPLEFT"}, "text": "cells.", "orig": "cells.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Figure 11: Simple table with different style and empty cells."}, {"label": "caption", "id": 1, "page_no": 13, "cluster": {"id": 1, "label": "caption", "bbox": {"l": 54.619, "t": 672.087, "r": 281.856, "b": 680.639, "coord_origin": "TOPLEFT"}, "confidence": 0.926384687423706, "cells": [{"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 54.619, "r_y0": 680.639, "r_x1": 95.854, "r_y1": 680.639, "r_x2": 95.854, "r_y2": 672.087, "r_x3": 54.619, "r_y3": 672.087, "coord_origin": "TOPLEFT"}, "text": "Figure 12:", "orig": "Figure 12:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 101.433, "r_y0": 680.639, "r_x1": 281.856, "r_y1": 680.639, "r_x2": 281.856, "r_y2": 672.087, "r_x3": 101.433, "r_y3": 672.087, "coord_origin": "TOPLEFT"}, "text": "Simple table predictions and post processing.", "orig": "Simple table predictions and post processing.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Figure 12: Simple table predictions and post processing."}, {"label": "caption", "id": 3, "page_no": 13, "cluster": {"id": 3, "label": "caption", "bbox": {"l": 315.79, "t": 371.953, "r": 538.185, "b": 380.505, "coord_origin": "TOPLEFT"}, "confidence": 0.9178510904312134, "cells": [{"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 315.79, "r_y0": 380.505, "r_x1": 357.025, "r_y1": 380.505, "r_x2": 357.025, "r_y2": 371.953, "r_x3": 315.79, "r_y3": 371.953, "coord_origin": "TOPLEFT"}, "text": "Figure 13:", "orig": "Figure 13:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 362.604, "r_y0": 380.505, "r_x1": 538.185, "r_y1": 380.505, "r_x2": 538.185, "r_y2": 371.953, "r_x3": 362.604, "r_y3": 371.953, "coord_origin": "TOPLEFT"}, "text": "Table predictions example on colorful table.", "orig": "Table predictions example on colorful table.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Figure 13: Table predictions example on colorful table."}, {"label": "caption", "id": 2, "page_no": 13, "cluster": {"id": 2, "label": "caption", "bbox": {"l": 344.985, "t": 683.815, "r": 508.989, "b": 692.367, "coord_origin": "TOPLEFT"}, "confidence": 0.9191023111343384, "cells": [{"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 344.985, "r_y0": 692.367, "r_x1": 386.22, "r_y1": 692.367, "r_x2": 386.22, "r_y2": 683.815, "r_x3": 344.985, "r_y3": 683.815, "coord_origin": "TOPLEFT"}, "text": "Figure 14:", "orig": "Figure 14:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 391.799, "r_y0": 692.367, "r_x1": 508.989, "r_y1": 692.367, "r_x2": 508.989, "r_y2": 683.815, "r_x3": 391.799, "r_y3": 683.815, "coord_origin": "TOPLEFT"}, "text": "Example with multi-line text.", "orig": "Example with multi-line text.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Figure 14: Example with multi-line text."}, {"label": "page_footer", "id": 5, "page_no": 13, "cluster": {"id": 5, "label": "page_footer", "bbox": {"l": 292.631, "t": 734.402, "r": 302.594, "b": 742.954, "coord_origin": "TOPLEFT"}, "confidence": 0.887715220451355, "cells": [{"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 292.631, "r_y0": 742.954, "r_x1": 302.594, "r_y1": 742.954, "r_x2": 302.594, "r_y2": 734.402, "r_x3": 292.631, "r_y3": 734.402, "coord_origin": "TOPLEFT"}, "text": "14", "orig": "14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "14"}, {"label": "picture", "id": 41, "page_no": 13, "cluster": {"id": 41, "label": "picture", "bbox": {"l": 318.6332092285156, "t": 90.88423156738281, "r": 534.73583984375, "b": 359.0575866699219, "coord_origin": "TOPLEFT"}, "confidence": 0.5003598928451538, "cells": [], "children": []}, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null}, {"label": "picture", "id": 30, "page_no": 13, "cluster": {"id": 30, "label": "picture", "bbox": {"l": 51.15378952026367, "t": 104.30851745605469, "r": 282.8598937988281, "b": 344.90667724609375, "coord_origin": "TOPLEFT"}, "confidence": 0.5613773465156555, "cells": [], "children": []}, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null}, {"label": "table", "id": 23, "page_no": 13, "cluster": {"id": 23, "label": "table", "bbox": {"l": 318.9809265136719, "t": 161.23460388183594, "r": 534.6229248046875, "b": 214.6260528564453, "coord_origin": "TOPLEFT"}, "confidence": 0.6235634684562683, "cells": [], "children": []}, "text": null, "otsl_seq": ["fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, {"label": "table", "id": 33, "page_no": 13, "cluster": {"id": 33, "label": "table", "bbox": {"l": 319.0057678222656, "t": 226.10633850097656, "r": 534.408935546875, "b": 279.8576965332031, "coord_origin": "TOPLEFT"}, "confidence": 0.5502500534057617, "cells": [], "children": []}, "text": null, "otsl_seq": ["fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, {"label": "table", "id": 27, "page_no": 13, "cluster": {"id": 27, "label": "table", "bbox": {"l": 51.72642135620117, "t": 273.6092834472656, "r": 283.114013671875, "b": 344.2445068359375, "coord_origin": "TOPLEFT"}, "confidence": 0.5696635246276855, "cells": [], "children": []}, "text": null, "otsl_seq": ["ecel", "ched", "ched", "ched", "ched", "ched", "nl", "ecel", "ched", "ched", "ched", "ched", "ched", "nl", "ecel", "ched", "ched", "ched", "ched", "ched", "nl", "fcel", "ched", "ched", "ched", "ched", "ched", "nl", "fcel", "ched", "ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "ecel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, {"label": "table", "id": 38, "page_no": 13, "cluster": {"id": 38, "label": "table", "bbox": {"l": 328.1381530761719, "t": 288.6817932128906, "r": 523.8916015625, "b": 358.2724304199219, "coord_origin": "TOPLEFT"}, "confidence": 0.5227423310279846, "cells": [], "children": []}, "text": null, "otsl_seq": ["fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, {"label": "table", "id": 10, "page_no": 13, "cluster": {"id": 10, "label": "table", "bbox": {"l": 319.4707946777344, "t": 430.90301513671875, "r": 518.5693359375, "b": 477.94354248046875, "coord_origin": "TOPLEFT"}, "confidence": 0.8384715914726257, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, {"label": "table", "id": 9, "page_no": 13, "cluster": {"id": 9, "label": "table", "bbox": {"l": 51.434879302978516, "t": 453.48748779296875, "r": 310.7267150878906, "b": 491.82025146484375, "coord_origin": "TOPLEFT"}, "confidence": 0.8418155908584595, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, {"label": "table", "id": 8, "page_no": 13, "cluster": {"id": 8, "label": "table", "bbox": {"l": 319.982666015625, "t": 489.2437438964844, "r": 519.0963745117188, "b": 535.69580078125, "coord_origin": "TOPLEFT"}, "confidence": 0.8502867221832275, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, {"label": "table", "id": 4, "page_no": 13, "cluster": {"id": 4, "label": "table", "bbox": {"l": 50.86823654174805, "t": 504.09625244140625, "r": 310.6080017089844, "b": 542.4459838867188, "coord_origin": "TOPLEFT"}, "confidence": 0.8922696709632874, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, {"label": "table", "id": 15, "page_no": 13, "cluster": {"id": 15, "label": "table", "bbox": {"l": 319.8287658691406, "t": 546.4093017578125, "r": 519.6065673828125, "b": 593.1064453125, "coord_origin": "TOPLEFT"}, "confidence": 0.6817973256111145, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, {"label": "table", "id": 6, "page_no": 13, "cluster": {"id": 6, "label": "table", "bbox": {"l": 51.27280807495117, "t": 553.728515625, "r": 311.0897216796875, "b": 591.913330078125, "coord_origin": "TOPLEFT"}, "confidence": 0.88722163438797, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, {"label": "table", "id": 7, "page_no": 13, "cluster": {"id": 7, "label": "table", "bbox": {"l": 319.06494140625, "t": 609.8408203125, "r": 533.77392578125, "b": 669.1920776367188, "coord_origin": "TOPLEFT"}, "confidence": 0.8717735409736633, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "ched", "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, {"label": "picture", "id": 11, "page_no": 13, "cluster": {"id": 11, "label": "picture", "bbox": {"l": 50.40477752685547, "t": 611.0038452148438, "r": 177.0564422607422, "b": 656.1609497070312, "coord_origin": "TOPLEFT"}, "confidence": 0.7871124744415283, "cells": [], "children": []}, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null}], "body": [{"label": "caption", "id": 0, "page_no": 13, "cluster": {"id": 0, "label": "caption", "bbox": {"l": 50.112, "t": 357.039, "r": 286.365, "b": 377.546, "coord_origin": "TOPLEFT"}, "confidence": 0.951069176197052, "cells": [{"index": 0, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 365.591, "r_x1": 93.051, "r_y1": 365.591, "r_x2": 93.051, "r_y2": 357.039, "r_x3": 50.112, "r_y3": 357.039, "coord_origin": "TOPLEFT"}, "text": "Figure 11:", "orig": "Figure 11:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 103.731, "r_y0": 365.591, "r_x1": 215.67, "r_y1": 365.591, "r_x2": 215.67, "r_y2": 357.039, "r_x3": 103.731, "r_y3": 357.039, "coord_origin": "TOPLEFT"}, "text": "Simple table with different", "orig": "Simple table with different", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 219.865, "r_y0": 365.591, "r_x1": 238.684, "r_y1": 365.591, "r_x2": 238.684, "r_y2": 357.039, "r_x3": 219.865, "r_y3": 357.039, "coord_origin": "TOPLEFT"}, "text": "style", "orig": "style", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 242.878, "r_y0": 365.591, "r_x1": 286.365, "r_y1": 365.591, "r_x2": 286.365, "r_y2": 357.039, "r_x3": 242.878, "r_y3": 357.039, "coord_origin": "TOPLEFT"}, "text": "and empty", "orig": "and empty", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 377.546, "r_x1": 70.864, "r_y1": 377.546, "r_x2": 70.864, "r_y2": 368.994, "r_x3": 50.112, "r_y3": 368.994, "coord_origin": "TOPLEFT"}, "text": "cells.", "orig": "cells.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Figure 11: Simple table with different style and empty cells."}, {"label": "caption", "id": 1, "page_no": 13, "cluster": {"id": 1, "label": "caption", "bbox": {"l": 54.619, "t": 672.087, "r": 281.856, "b": 680.639, "coord_origin": "TOPLEFT"}, "confidence": 0.926384687423706, "cells": [{"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 54.619, "r_y0": 680.639, "r_x1": 95.854, "r_y1": 680.639, "r_x2": 95.854, "r_y2": 672.087, "r_x3": 54.619, "r_y3": 672.087, "coord_origin": "TOPLEFT"}, "text": "Figure 12:", "orig": "Figure 12:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 6, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 101.433, "r_y0": 680.639, "r_x1": 281.856, "r_y1": 680.639, "r_x2": 281.856, "r_y2": 672.087, "r_x3": 101.433, "r_y3": 672.087, "coord_origin": "TOPLEFT"}, "text": "Simple table predictions and post processing.", "orig": "Simple table predictions and post processing.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Figure 12: Simple table predictions and post processing."}, {"label": "caption", "id": 3, "page_no": 13, "cluster": {"id": 3, "label": "caption", "bbox": {"l": 315.79, "t": 371.953, "r": 538.185, "b": 380.505, "coord_origin": "TOPLEFT"}, "confidence": 0.9178510904312134, "cells": [{"index": 7, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 315.79, "r_y0": 380.505, "r_x1": 357.025, "r_y1": 380.505, "r_x2": 357.025, "r_y2": 371.953, "r_x3": 315.79, "r_y3": 371.953, "coord_origin": "TOPLEFT"}, "text": "Figure 13:", "orig": "Figure 13:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 8, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 362.604, "r_y0": 380.505, "r_x1": 538.185, "r_y1": 380.505, "r_x2": 538.185, "r_y2": 371.953, "r_x3": 362.604, "r_y3": 371.953, "coord_origin": "TOPLEFT"}, "text": "Table predictions example on colorful table.", "orig": "Table predictions example on colorful table.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Figure 13: Table predictions example on colorful table."}, {"label": "caption", "id": 2, "page_no": 13, "cluster": {"id": 2, "label": "caption", "bbox": {"l": 344.985, "t": 683.815, "r": 508.989, "b": 692.367, "coord_origin": "TOPLEFT"}, "confidence": 0.9191023111343384, "cells": [{"index": 9, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 344.985, "r_y0": 692.367, "r_x1": 386.22, "r_y1": 692.367, "r_x2": 386.22, "r_y2": 683.815, "r_x3": 344.985, "r_y3": 683.815, "coord_origin": "TOPLEFT"}, "text": "Figure 14:", "orig": "Figure 14:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 10, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 391.799, "r_y0": 692.367, "r_x1": 508.989, "r_y1": 692.367, "r_x2": 508.989, "r_y2": 683.815, "r_x3": 391.799, "r_y3": 683.815, "coord_origin": "TOPLEFT"}, "text": "Example with multi-line text.", "orig": "Example with multi-line text.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Figure 14: Example with multi-line text."}, {"label": "picture", "id": 41, "page_no": 13, "cluster": {"id": 41, "label": "picture", "bbox": {"l": 318.6332092285156, "t": 90.88423156738281, "r": 534.73583984375, "b": 359.0575866699219, "coord_origin": "TOPLEFT"}, "confidence": 0.5003598928451538, "cells": [], "children": []}, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null}, {"label": "picture", "id": 30, "page_no": 13, "cluster": {"id": 30, "label": "picture", "bbox": {"l": 51.15378952026367, "t": 104.30851745605469, "r": 282.8598937988281, "b": 344.90667724609375, "coord_origin": "TOPLEFT"}, "confidence": 0.5613773465156555, "cells": [], "children": []}, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null}, {"label": "table", "id": 23, "page_no": 13, "cluster": {"id": 23, "label": "table", "bbox": {"l": 318.9809265136719, "t": 161.23460388183594, "r": 534.6229248046875, "b": 214.6260528564453, "coord_origin": "TOPLEFT"}, "confidence": 0.6235634684562683, "cells": [], "children": []}, "text": null, "otsl_seq": ["fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, {"label": "table", "id": 33, "page_no": 13, "cluster": {"id": 33, "label": "table", "bbox": {"l": 319.0057678222656, "t": 226.10633850097656, "r": 534.408935546875, "b": 279.8576965332031, "coord_origin": "TOPLEFT"}, "confidence": 0.5502500534057617, "cells": [], "children": []}, "text": null, "otsl_seq": ["fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, {"label": "table", "id": 27, "page_no": 13, "cluster": {"id": 27, "label": "table", "bbox": {"l": 51.72642135620117, "t": 273.6092834472656, "r": 283.114013671875, "b": 344.2445068359375, "coord_origin": "TOPLEFT"}, "confidence": 0.5696635246276855, "cells": [], "children": []}, "text": null, "otsl_seq": ["ecel", "ched", "ched", "ched", "ched", "ched", "nl", "ecel", "ched", "ched", "ched", "ched", "ched", "nl", "ecel", "ched", "ched", "ched", "ched", "ched", "nl", "fcel", "ched", "ched", "ched", "ched", "ched", "nl", "fcel", "ched", "ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "ecel", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, {"label": "table", "id": 38, "page_no": 13, "cluster": {"id": 38, "label": "table", "bbox": {"l": 328.1381530761719, "t": 288.6817932128906, "r": 523.8916015625, "b": 358.2724304199219, "coord_origin": "TOPLEFT"}, "confidence": 0.5227423310279846, "cells": [], "children": []}, "text": null, "otsl_seq": ["fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, {"label": "table", "id": 10, "page_no": 13, "cluster": {"id": 10, "label": "table", "bbox": {"l": 319.4707946777344, "t": 430.90301513671875, "r": 518.5693359375, "b": 477.94354248046875, "coord_origin": "TOPLEFT"}, "confidence": 0.8384715914726257, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, {"label": "table", "id": 9, "page_no": 13, "cluster": {"id": 9, "label": "table", "bbox": {"l": 51.434879302978516, "t": 453.48748779296875, "r": 310.7267150878906, "b": 491.82025146484375, "coord_origin": "TOPLEFT"}, "confidence": 0.8418155908584595, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, {"label": "table", "id": 8, "page_no": 13, "cluster": {"id": 8, "label": "table", "bbox": {"l": 319.982666015625, "t": 489.2437438964844, "r": 519.0963745117188, "b": 535.69580078125, "coord_origin": "TOPLEFT"}, "confidence": 0.8502867221832275, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, {"label": "table", "id": 4, "page_no": 13, "cluster": {"id": 4, "label": "table", "bbox": {"l": 50.86823654174805, "t": 504.09625244140625, "r": 310.6080017089844, "b": 542.4459838867188, "coord_origin": "TOPLEFT"}, "confidence": 0.8922696709632874, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, {"label": "table", "id": 15, "page_no": 13, "cluster": {"id": 15, "label": "table", "bbox": {"l": 319.8287658691406, "t": 546.4093017578125, "r": 519.6065673828125, "b": 593.1064453125, "coord_origin": "TOPLEFT"}, "confidence": 0.6817973256111145, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, {"label": "table", "id": 6, "page_no": 13, "cluster": {"id": 6, "label": "table", "bbox": {"l": 51.27280807495117, "t": 553.728515625, "r": 311.0897216796875, "b": 591.913330078125, "coord_origin": "TOPLEFT"}, "confidence": 0.88722163438797, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl", "rhed", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, {"label": "table", "id": 7, "page_no": 13, "cluster": {"id": 7, "label": "table", "bbox": {"l": 319.06494140625, "t": 609.8408203125, "r": 533.77392578125, "b": 669.1920776367188, "coord_origin": "TOPLEFT"}, "confidence": 0.8717735409736633, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "ched", "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, {"label": "picture", "id": 11, "page_no": 13, "cluster": {"id": 11, "label": "picture", "bbox": {"l": 50.40477752685547, "t": 611.0038452148438, "r": 177.0564422607422, "b": 656.1609497070312, "coord_origin": "TOPLEFT"}, "confidence": 0.7871124744415283, "cells": [], "children": []}, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null}], "headers": [{"label": "page_footer", "id": 5, "page_no": 13, "cluster": {"id": 5, "label": "page_footer", "bbox": {"l": 292.631, "t": 734.402, "r": 302.594, "b": 742.954, "coord_origin": "TOPLEFT"}, "confidence": 0.887715220451355, "cells": [{"index": 11, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 292.631, "r_y0": 742.954, "r_x1": 302.594, "r_y1": 742.954, "r_x2": 302.594, "r_y2": 734.402, "r_x3": 292.631, "r_y3": 734.402, "coord_origin": "TOPLEFT"}, "text": "14", "orig": "14", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "14"}]}}, {"page_no": 14, "size": {"width": 612.0, "height": 792.0}, "cells": [{"index": 0, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 84.233, "r_y0": 653.172, "r_x1": 125.468, "r_y1": 653.172, "r_x2": 125.468, "r_y2": 644.62, "r_x3": 84.233, "r_y3": 644.62, "coord_origin": "TOPLEFT"}, "text": "Figure 15:", "orig": "Figure 15:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 131.047, "r_y0": 653.172, "r_x1": 252.242, "r_y1": 653.172, "r_x2": 252.242, "r_y2": 644.62, "r_x3": 131.047, "r_y3": 644.62, "coord_origin": "TOPLEFT"}, "text": "Example with triangular table.", "orig": "Example with triangular table.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 661.756, "r_x1": 349.559, "r_y1": 661.756, "r_x2": 349.559, "r_y2": 653.204, "r_x3": 308.862, "r_y3": 653.204, "coord_origin": "TOPLEFT"}, "text": "Figure 16:", "orig": "Figure 16:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 354.341, "r_y0": 661.756, "r_x1": 545.115, "r_y1": 661.756, "r_x2": 545.115, "r_y2": 653.204, "r_x3": 354.341, "r_y3": 653.204, "coord_origin": "TOPLEFT"}, "text": "Example of how post-processing helps to restore", "orig": "Example of how post-processing helps to restore", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 673.711, "r_x1": 497.603, "r_y1": 673.711, "r_x2": 497.603, "r_y2": 665.159, "r_x3": 308.862, "r_y3": 665.159, "coord_origin": "TOPLEFT"}, "text": "mis-aligned bounding boxes prediction artifact.", "orig": "mis-aligned bounding boxes prediction artifact.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 292.631, "r_y0": 742.954, "r_x1": 302.594, "r_y1": 742.954, "r_x2": 302.594, "r_y2": 734.402, "r_x3": 292.631, "r_y3": 734.402, "coord_origin": "TOPLEFT"}, "text": "15", "orig": "15", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "parsed_page": null, "predictions": {"layout": {"clusters": [{"id": 0, "label": "caption", "bbox": {"l": 84.233, "t": 644.62, "r": 252.242, "b": 653.172, "coord_origin": "TOPLEFT"}, "confidence": 0.9257225394248962, "cells": [{"index": 0, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 84.233, "r_y0": 653.172, "r_x1": 125.468, "r_y1": 653.172, "r_x2": 125.468, "r_y2": 644.62, "r_x3": 84.233, "r_y3": 644.62, "coord_origin": "TOPLEFT"}, "text": "Figure 15:", "orig": "Figure 15:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 131.047, "r_y0": 653.172, "r_x1": 252.242, "r_y1": 653.172, "r_x2": 252.242, "r_y2": 644.62, "r_x3": 131.047, "r_y3": 644.62, "coord_origin": "TOPLEFT"}, "text": "Example with triangular table.", "orig": "Example with triangular table.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 1, "label": "caption", "bbox": {"l": 308.862, "t": 653.204, "r": 545.115, "b": 673.711, "coord_origin": "TOPLEFT"}, "confidence": 0.9134758710861206, "cells": [{"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 661.756, "r_x1": 349.559, "r_y1": 661.756, "r_x2": 349.559, "r_y2": 653.204, "r_x3": 308.862, "r_y3": 653.204, "coord_origin": "TOPLEFT"}, "text": "Figure 16:", "orig": "Figure 16:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 354.341, "r_y0": 661.756, "r_x1": 545.115, "r_y1": 661.756, "r_x2": 545.115, "r_y2": 653.204, "r_x3": 354.341, "r_y3": 653.204, "coord_origin": "TOPLEFT"}, "text": "Example of how post-processing helps to restore", "orig": "Example of how post-processing helps to restore", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 673.711, "r_x1": 497.603, "r_y1": 673.711, "r_x2": 497.603, "r_y2": 665.159, "r_x3": 308.862, "r_y3": 665.159, "coord_origin": "TOPLEFT"}, "text": "mis-aligned bounding boxes prediction artifact.", "orig": "mis-aligned bounding boxes prediction artifact.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 3, "label": "page_footer", "bbox": {"l": 292.631, "t": 734.402, "r": 302.594, "b": 742.954, "coord_origin": "TOPLEFT"}, "confidence": 0.9037020802497864, "cells": [{"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 292.631, "r_y0": 742.954, "r_x1": 302.594, "r_y1": 742.954, "r_x2": 302.594, "r_y2": 734.402, "r_x3": 292.631, "r_y3": 734.402, "coord_origin": "TOPLEFT"}, "text": "15", "orig": "15", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 4, "label": "table", "bbox": {"l": 323.0059509277344, "t": 121.54714965820312, "r": 525.95166015625, "b": 222.91140747070312, "coord_origin": "TOPLEFT"}, "confidence": 0.8569068908691406, "cells": [], "children": []}, {"id": 6, "label": "picture", "bbox": {"l": 55.116363525390625, "t": 136.2550048828125, "r": 279.370849609375, "b": 249.3345489501953, "coord_origin": "TOPLEFT"}, "confidence": 0.8099280595779419, "cells": [], "children": []}, {"id": 19, "label": "table", "bbox": {"l": 55.116363525390625, "t": 136.2550048828125, "r": 279.370849609375, "b": 249.3345489501953, "coord_origin": "TOPLEFT"}, "confidence": 0.5584819912910461, "cells": [], "children": []}, {"id": 2, "label": "table", "bbox": {"l": 323.384765625, "t": 241.9729461669922, "r": 526.1268920898438, "b": 344.09210205078125, "coord_origin": "TOPLEFT"}, "confidence": 0.9060239195823669, "cells": [], "children": []}, {"id": 18, "label": "picture", "bbox": {"l": 54.28135299682617, "t": 260.2615661621094, "r": 279.2568359375, "b": 373.5270690917969, "coord_origin": "TOPLEFT"}, "confidence": 0.567050039768219, "cells": [], "children": []}, {"id": 10, "label": "table", "bbox": {"l": 54.28135299682617, "t": 260.2615661621094, "r": 279.2568359375, "b": 373.5270690917969, "coord_origin": "TOPLEFT"}, "confidence": 0.7748245000839233, "cells": [], "children": []}, {"id": 20, "label": "picture", "bbox": {"l": 323.46868896484375, "t": 362.4508361816406, "r": 525.9569091796875, "b": 464.260498046875, "coord_origin": "TOPLEFT"}, "confidence": 0.5515198707580566, "cells": [], "children": []}, {"id": 9, "label": "table", "bbox": {"l": 323.46868896484375, "t": 362.4508361816406, "r": 525.9569091796875, "b": 464.260498046875, "coord_origin": "TOPLEFT"}, "confidence": 0.7755160927772522, "cells": [], "children": []}, {"id": 5, "label": "picture", "bbox": {"l": 55.423954010009766, "t": 384.5550537109375, "r": 280.2310791015625, "b": 497.563720703125, "coord_origin": "TOPLEFT"}, "confidence": 0.8410326838493347, "cells": [], "children": []}, {"id": 22, "label": "picture", "bbox": {"l": 353.6920471191406, "t": 487.405029296875, "r": 495.4288024902344, "b": 635.7732543945312, "coord_origin": "TOPLEFT"}, "confidence": 0.5478786826133728, "cells": [], "children": []}, {"id": 8, "label": "table", "bbox": {"l": 353.6920471191406, "t": 487.405029296875, "r": 495.4288024902344, "b": 635.7732543945312, "coord_origin": "TOPLEFT"}, "confidence": 0.7805566787719727, "cells": [], "children": []}, {"id": 7, "label": "picture", "bbox": {"l": 50.64818572998047, "t": 505.98046875, "r": 319.9103088378906, "b": 631.263671875, "coord_origin": "TOPLEFT"}, "confidence": 0.8057592511177063, "cells": [], "children": []}, {"id": 11, "label": "table", "bbox": {"l": 50.64818572998047, "t": 505.98046875, "r": 319.9103088378906, "b": 631.263671875, "coord_origin": "TOPLEFT"}, "confidence": 0.6835257411003113, "cells": [], "children": []}]}, "tablestructure": {"table_map": {"4": {"label": "table", "id": 4, "page_no": 14, "cluster": {"id": 4, "label": "table", "bbox": {"l": 323.0059509277344, "t": 121.54714965820312, "r": 525.95166015625, "b": 222.91140747070312, "coord_origin": "TOPLEFT"}, "confidence": 0.8569068908691406, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "ched", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, "19": {"label": "table", "id": 19, "page_no": 14, "cluster": {"id": 19, "label": "table", "bbox": {"l": 55.116363525390625, "t": 136.2550048828125, "r": 279.370849609375, "b": 249.3345489501953, "coord_origin": "TOPLEFT"}, "confidence": 0.5584819912910461, "cells": [], "children": []}, "text": null, "otsl_seq": ["ecel", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "ecel", "ecel", "ecel", "ecel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "ecel", "ecel", "ecel", "ecel", "ecel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "ecel", "ecel", "ecel", "ecel", "ecel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "ecel", "ecel", "ecel", "ecel", "ecel", "ecel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "ecel", "ecel", "ecel", "ecel", "ecel", "ecel", "ecel", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, "2": {"label": "table", "id": 2, "page_no": 14, "cluster": {"id": 2, "label": "table", "bbox": {"l": 323.384765625, "t": 241.9729461669922, "r": 526.1268920898438, "b": 344.09210205078125, "coord_origin": "TOPLEFT"}, "confidence": 0.9060239195823669, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "ched", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, "10": {"label": "table", "id": 10, "page_no": 14, "cluster": {"id": 10, "label": "table", "bbox": {"l": 54.28135299682617, "t": 260.2615661621094, "r": 279.2568359375, "b": 373.5270690917969, "coord_origin": "TOPLEFT"}, "confidence": 0.7748245000839233, "cells": [], "children": []}, "text": null, "otsl_seq": ["fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, "9": {"label": "table", "id": 9, "page_no": 14, "cluster": {"id": 9, "label": "table", "bbox": {"l": 323.46868896484375, "t": 362.4508361816406, "r": 525.9569091796875, "b": 464.260498046875, "coord_origin": "TOPLEFT"}, "confidence": 0.7755160927772522, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "ched", "nl", "rhed", "fcel", "nl", "rhed", "fcel", "nl", "rhed", "fcel", "nl", "rhed", "fcel", "nl", "rhed", "fcel", "nl", "rhed", "fcel", "nl", "rhed", "fcel", "nl", "rhed", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, "8": {"label": "table", "id": 8, "page_no": 14, "cluster": {"id": 8, "label": "table", "bbox": {"l": 353.6920471191406, "t": 487.405029296875, "r": 495.4288024902344, "b": 635.7732543945312, "coord_origin": "TOPLEFT"}, "confidence": 0.7805566787719727, "cells": [], "children": []}, "text": null, "otsl_seq": ["fcel", "ched", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, "11": {"label": "table", "id": 11, "page_no": 14, "cluster": {"id": 11, "label": "table", "bbox": {"l": 50.64818572998047, "t": 505.98046875, "r": 319.9103088378906, "b": 631.263671875, "coord_origin": "TOPLEFT"}, "confidence": 0.6835257411003113, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}}}, "figures_classification": null, "equations_prediction": null, "vlm_response": null}, "assembled": {"elements": [{"label": "caption", "id": 0, "page_no": 14, "cluster": {"id": 0, "label": "caption", "bbox": {"l": 84.233, "t": 644.62, "r": 252.242, "b": 653.172, "coord_origin": "TOPLEFT"}, "confidence": 0.9257225394248962, "cells": [{"index": 0, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 84.233, "r_y0": 653.172, "r_x1": 125.468, "r_y1": 653.172, "r_x2": 125.468, "r_y2": 644.62, "r_x3": 84.233, "r_y3": 644.62, "coord_origin": "TOPLEFT"}, "text": "Figure 15:", "orig": "Figure 15:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 131.047, "r_y0": 653.172, "r_x1": 252.242, "r_y1": 653.172, "r_x2": 252.242, "r_y2": 644.62, "r_x3": 131.047, "r_y3": 644.62, "coord_origin": "TOPLEFT"}, "text": "Example with triangular table.", "orig": "Example with triangular table.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Figure 15: Example with triangular table."}, {"label": "caption", "id": 1, "page_no": 14, "cluster": {"id": 1, "label": "caption", "bbox": {"l": 308.862, "t": 653.204, "r": 545.115, "b": 673.711, "coord_origin": "TOPLEFT"}, "confidence": 0.9134758710861206, "cells": [{"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 661.756, "r_x1": 349.559, "r_y1": 661.756, "r_x2": 349.559, "r_y2": 653.204, "r_x3": 308.862, "r_y3": 653.204, "coord_origin": "TOPLEFT"}, "text": "Figure 16:", "orig": "Figure 16:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 354.341, "r_y0": 661.756, "r_x1": 545.115, "r_y1": 661.756, "r_x2": 545.115, "r_y2": 653.204, "r_x3": 354.341, "r_y3": 653.204, "coord_origin": "TOPLEFT"}, "text": "Example of how post-processing helps to restore", "orig": "Example of how post-processing helps to restore", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 673.711, "r_x1": 497.603, "r_y1": 673.711, "r_x2": 497.603, "r_y2": 665.159, "r_x3": 308.862, "r_y3": 665.159, "coord_origin": "TOPLEFT"}, "text": "mis-aligned bounding boxes prediction artifact.", "orig": "mis-aligned bounding boxes prediction artifact.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Figure 16: Example of how post-processing helps to restore mis-aligned bounding boxes prediction artifact."}, {"label": "page_footer", "id": 3, "page_no": 14, "cluster": {"id": 3, "label": "page_footer", "bbox": {"l": 292.631, "t": 734.402, "r": 302.594, "b": 742.954, "coord_origin": "TOPLEFT"}, "confidence": 0.9037020802497864, "cells": [{"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 292.631, "r_y0": 742.954, "r_x1": 302.594, "r_y1": 742.954, "r_x2": 302.594, "r_y2": 734.402, "r_x3": 292.631, "r_y3": 734.402, "coord_origin": "TOPLEFT"}, "text": "15", "orig": "15", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "15"}, {"label": "table", "id": 4, "page_no": 14, "cluster": {"id": 4, "label": "table", "bbox": {"l": 323.0059509277344, "t": 121.54714965820312, "r": 525.95166015625, "b": 222.91140747070312, "coord_origin": "TOPLEFT"}, "confidence": 0.8569068908691406, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "ched", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, {"label": "picture", "id": 6, "page_no": 14, "cluster": {"id": 6, "label": "picture", "bbox": {"l": 55.116363525390625, "t": 136.2550048828125, "r": 279.370849609375, "b": 249.3345489501953, "coord_origin": "TOPLEFT"}, "confidence": 0.8099280595779419, "cells": [], "children": []}, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null}, {"label": "table", "id": 19, "page_no": 14, "cluster": {"id": 19, "label": "table", "bbox": {"l": 55.116363525390625, "t": 136.2550048828125, "r": 279.370849609375, "b": 249.3345489501953, "coord_origin": "TOPLEFT"}, "confidence": 0.5584819912910461, "cells": [], "children": []}, "text": null, "otsl_seq": ["ecel", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "ecel", "ecel", "ecel", "ecel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "ecel", "ecel", "ecel", "ecel", "ecel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "ecel", "ecel", "ecel", "ecel", "ecel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "ecel", "ecel", "ecel", "ecel", "ecel", "ecel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "ecel", "ecel", "ecel", "ecel", "ecel", "ecel", "ecel", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, {"label": "table", "id": 2, "page_no": 14, "cluster": {"id": 2, "label": "table", "bbox": {"l": 323.384765625, "t": 241.9729461669922, "r": 526.1268920898438, "b": 344.09210205078125, "coord_origin": "TOPLEFT"}, "confidence": 0.9060239195823669, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "ched", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, {"label": "picture", "id": 18, "page_no": 14, "cluster": {"id": 18, "label": "picture", "bbox": {"l": 54.28135299682617, "t": 260.2615661621094, "r": 279.2568359375, "b": 373.5270690917969, "coord_origin": "TOPLEFT"}, "confidence": 0.567050039768219, "cells": [], "children": []}, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null}, {"label": "table", "id": 10, "page_no": 14, "cluster": {"id": 10, "label": "table", "bbox": {"l": 54.28135299682617, "t": 260.2615661621094, "r": 279.2568359375, "b": 373.5270690917969, "coord_origin": "TOPLEFT"}, "confidence": 0.7748245000839233, "cells": [], "children": []}, "text": null, "otsl_seq": ["fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, {"label": "picture", "id": 20, "page_no": 14, "cluster": {"id": 20, "label": "picture", "bbox": {"l": 323.46868896484375, "t": 362.4508361816406, "r": 525.9569091796875, "b": 464.260498046875, "coord_origin": "TOPLEFT"}, "confidence": 0.5515198707580566, "cells": [], "children": []}, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null}, {"label": "table", "id": 9, "page_no": 14, "cluster": {"id": 9, "label": "table", "bbox": {"l": 323.46868896484375, "t": 362.4508361816406, "r": 525.9569091796875, "b": 464.260498046875, "coord_origin": "TOPLEFT"}, "confidence": 0.7755160927772522, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "ched", "nl", "rhed", "fcel", "nl", "rhed", "fcel", "nl", "rhed", "fcel", "nl", "rhed", "fcel", "nl", "rhed", "fcel", "nl", "rhed", "fcel", "nl", "rhed", "fcel", "nl", "rhed", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, {"label": "picture", "id": 5, "page_no": 14, "cluster": {"id": 5, "label": "picture", "bbox": {"l": 55.423954010009766, "t": 384.5550537109375, "r": 280.2310791015625, "b": 497.563720703125, "coord_origin": "TOPLEFT"}, "confidence": 0.8410326838493347, "cells": [], "children": []}, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null}, {"label": "picture", "id": 22, "page_no": 14, "cluster": {"id": 22, "label": "picture", "bbox": {"l": 353.6920471191406, "t": 487.405029296875, "r": 495.4288024902344, "b": 635.7732543945312, "coord_origin": "TOPLEFT"}, "confidence": 0.5478786826133728, "cells": [], "children": []}, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null}, {"label": "table", "id": 8, "page_no": 14, "cluster": {"id": 8, "label": "table", "bbox": {"l": 353.6920471191406, "t": 487.405029296875, "r": 495.4288024902344, "b": 635.7732543945312, "coord_origin": "TOPLEFT"}, "confidence": 0.7805566787719727, "cells": [], "children": []}, "text": null, "otsl_seq": ["fcel", "ched", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, {"label": "picture", "id": 7, "page_no": 14, "cluster": {"id": 7, "label": "picture", "bbox": {"l": 50.64818572998047, "t": 505.98046875, "r": 319.9103088378906, "b": 631.263671875, "coord_origin": "TOPLEFT"}, "confidence": 0.8057592511177063, "cells": [], "children": []}, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null}, {"label": "table", "id": 11, "page_no": 14, "cluster": {"id": 11, "label": "table", "bbox": {"l": 50.64818572998047, "t": 505.98046875, "r": 319.9103088378906, "b": 631.263671875, "coord_origin": "TOPLEFT"}, "confidence": 0.6835257411003113, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}], "body": [{"label": "caption", "id": 0, "page_no": 14, "cluster": {"id": 0, "label": "caption", "bbox": {"l": 84.233, "t": 644.62, "r": 252.242, "b": 653.172, "coord_origin": "TOPLEFT"}, "confidence": 0.9257225394248962, "cells": [{"index": 0, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 84.233, "r_y0": 653.172, "r_x1": 125.468, "r_y1": 653.172, "r_x2": 125.468, "r_y2": 644.62, "r_x3": 84.233, "r_y3": 644.62, "coord_origin": "TOPLEFT"}, "text": "Figure 15:", "orig": "Figure 15:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 131.047, "r_y0": 653.172, "r_x1": 252.242, "r_y1": 653.172, "r_x2": 252.242, "r_y2": 644.62, "r_x3": 131.047, "r_y3": 644.62, "coord_origin": "TOPLEFT"}, "text": "Example with triangular table.", "orig": "Example with triangular table.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Figure 15: Example with triangular table."}, {"label": "caption", "id": 1, "page_no": 14, "cluster": {"id": 1, "label": "caption", "bbox": {"l": 308.862, "t": 653.204, "r": 545.115, "b": 673.711, "coord_origin": "TOPLEFT"}, "confidence": 0.9134758710861206, "cells": [{"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 661.756, "r_x1": 349.559, "r_y1": 661.756, "r_x2": 349.559, "r_y2": 653.204, "r_x3": 308.862, "r_y3": 653.204, "coord_origin": "TOPLEFT"}, "text": "Figure 16:", "orig": "Figure 16:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 354.341, "r_y0": 661.756, "r_x1": 545.115, "r_y1": 661.756, "r_x2": 545.115, "r_y2": 653.204, "r_x3": 354.341, "r_y3": 653.204, "coord_origin": "TOPLEFT"}, "text": "Example of how post-processing helps to restore", "orig": "Example of how post-processing helps to restore", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 4, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 308.862, "r_y0": 673.711, "r_x1": 497.603, "r_y1": 673.711, "r_x2": 497.603, "r_y2": 665.159, "r_x3": 308.862, "r_y3": 665.159, "coord_origin": "TOPLEFT"}, "text": "mis-aligned bounding boxes prediction artifact.", "orig": "mis-aligned bounding boxes prediction artifact.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Figure 16: Example of how post-processing helps to restore mis-aligned bounding boxes prediction artifact."}, {"label": "table", "id": 4, "page_no": 14, "cluster": {"id": 4, "label": "table", "bbox": {"l": 323.0059509277344, "t": 121.54714965820312, "r": 525.95166015625, "b": 222.91140747070312, "coord_origin": "TOPLEFT"}, "confidence": 0.8569068908691406, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "ched", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, {"label": "picture", "id": 6, "page_no": 14, "cluster": {"id": 6, "label": "picture", "bbox": {"l": 55.116363525390625, "t": 136.2550048828125, "r": 279.370849609375, "b": 249.3345489501953, "coord_origin": "TOPLEFT"}, "confidence": 0.8099280595779419, "cells": [], "children": []}, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null}, {"label": "table", "id": 19, "page_no": 14, "cluster": {"id": 19, "label": "table", "bbox": {"l": 55.116363525390625, "t": 136.2550048828125, "r": 279.370849609375, "b": 249.3345489501953, "coord_origin": "TOPLEFT"}, "confidence": 0.5584819912910461, "cells": [], "children": []}, "text": null, "otsl_seq": ["ecel", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "nl", "rhed", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "ecel", "ecel", "ecel", "ecel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "ecel", "ecel", "ecel", "ecel", "ecel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "ecel", "ecel", "ecel", "ecel", "ecel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "ecel", "ecel", "ecel", "ecel", "ecel", "ecel", "fcel", "fcel", "fcel", "fcel", "nl", "rhed", "ecel", "ecel", "ecel", "ecel", "ecel", "ecel", "ecel", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, {"label": "table", "id": 2, "page_no": 14, "cluster": {"id": 2, "label": "table", "bbox": {"l": 323.384765625, "t": 241.9729461669922, "r": 526.1268920898438, "b": 344.09210205078125, "coord_origin": "TOPLEFT"}, "confidence": 0.9060239195823669, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "ched", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, {"label": "picture", "id": 18, "page_no": 14, "cluster": {"id": 18, "label": "picture", "bbox": {"l": 54.28135299682617, "t": 260.2615661621094, "r": 279.2568359375, "b": 373.5270690917969, "coord_origin": "TOPLEFT"}, "confidence": 0.567050039768219, "cells": [], "children": []}, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null}, {"label": "table", "id": 10, "page_no": 14, "cluster": {"id": 10, "label": "table", "bbox": {"l": 54.28135299682617, "t": 260.2615661621094, "r": 279.2568359375, "b": 373.5270690917969, "coord_origin": "TOPLEFT"}, "confidence": 0.7748245000839233, "cells": [], "children": []}, "text": null, "otsl_seq": ["fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, {"label": "picture", "id": 20, "page_no": 14, "cluster": {"id": 20, "label": "picture", "bbox": {"l": 323.46868896484375, "t": 362.4508361816406, "r": 525.9569091796875, "b": 464.260498046875, "coord_origin": "TOPLEFT"}, "confidence": 0.5515198707580566, "cells": [], "children": []}, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null}, {"label": "table", "id": 9, "page_no": 14, "cluster": {"id": 9, "label": "table", "bbox": {"l": 323.46868896484375, "t": 362.4508361816406, "r": 525.9569091796875, "b": 464.260498046875, "coord_origin": "TOPLEFT"}, "confidence": 0.7755160927772522, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "ched", "nl", "rhed", "fcel", "nl", "rhed", "fcel", "nl", "rhed", "fcel", "nl", "rhed", "fcel", "nl", "rhed", "fcel", "nl", "rhed", "fcel", "nl", "rhed", "fcel", "nl", "rhed", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, {"label": "picture", "id": 5, "page_no": 14, "cluster": {"id": 5, "label": "picture", "bbox": {"l": 55.423954010009766, "t": 384.5550537109375, "r": 280.2310791015625, "b": 497.563720703125, "coord_origin": "TOPLEFT"}, "confidence": 0.8410326838493347, "cells": [], "children": []}, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null}, {"label": "picture", "id": 22, "page_no": 14, "cluster": {"id": 22, "label": "picture", "bbox": {"l": 353.6920471191406, "t": 487.405029296875, "r": 495.4288024902344, "b": 635.7732543945312, "coord_origin": "TOPLEFT"}, "confidence": 0.5478786826133728, "cells": [], "children": []}, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null}, {"label": "table", "id": 8, "page_no": 14, "cluster": {"id": 8, "label": "table", "bbox": {"l": 353.6920471191406, "t": 487.405029296875, "r": 495.4288024902344, "b": 635.7732543945312, "coord_origin": "TOPLEFT"}, "confidence": 0.7805566787719727, "cells": [], "children": []}, "text": null, "otsl_seq": ["fcel", "ched", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}, {"label": "picture", "id": 7, "page_no": 14, "cluster": {"id": 7, "label": "picture", "bbox": {"l": 50.64818572998047, "t": 505.98046875, "r": 319.9103088378906, "b": 631.263671875, "coord_origin": "TOPLEFT"}, "confidence": 0.8057592511177063, "cells": [], "children": []}, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null}, {"label": "table", "id": 11, "page_no": 14, "cluster": {"id": 11, "label": "table", "bbox": {"l": 50.64818572998047, "t": 505.98046875, "r": 319.9103088378906, "b": 631.263671875, "coord_origin": "TOPLEFT"}, "confidence": 0.6835257411003113, "cells": [], "children": []}, "text": null, "otsl_seq": ["ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "ched", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "fcel", "nl"], "num_rows": 0, "num_cols": 0, "table_cells": []}], "headers": [{"label": "page_footer", "id": 3, "page_no": 14, "cluster": {"id": 3, "label": "page_footer", "bbox": {"l": 292.631, "t": 734.402, "r": 302.594, "b": 742.954, "coord_origin": "TOPLEFT"}, "confidence": 0.9037020802497864, "cells": [{"index": 5, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 292.631, "r_y0": 742.954, "r_x1": 302.594, "r_y1": 742.954, "r_x2": 302.594, "r_y2": 734.402, "r_x3": 292.631, "r_y3": 734.402, "coord_origin": "TOPLEFT"}, "text": "15", "orig": "15", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "15"}]}}, {"page_no": 15, "size": {"width": 612.0, "height": 792.0}, "cells": [{"index": 0, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 517.158, "r_x1": 91.198, "r_y1": 517.158, "r_x2": 91.198, "r_y2": 508.606, "r_x3": 50.112, "r_y3": 508.606, "coord_origin": "TOPLEFT"}, "text": "Figure 17:", "orig": "Figure 17:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 96.558, "r_y0": 517.158, "r_x1": 545.114, "r_y1": 517.158, "r_x2": 545.114, "r_y2": 508.606, "r_x3": 96.558, "r_y3": 508.606, "coord_origin": "TOPLEFT"}, "text": "Example of long table. End-to-end example from initial PDF cells to prediction of bounding boxes, post process-", "orig": "Example of long table. End-to-end example from initial PDF cells to prediction of bounding boxes, post process-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 529.113, "r_x1": 173.24, "r_y1": 529.113, "r_x2": 173.24, "r_y2": 520.5609999999999, "r_x3": 50.112, "r_y3": 520.5609999999999, "coord_origin": "TOPLEFT"}, "text": "ing and prediction of structure.", "orig": "ing and prediction of structure.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 292.631, "r_y0": 742.954, "r_x1": 302.594, "r_y1": 742.954, "r_x2": 302.594, "r_y2": 734.402, "r_x3": 292.631, "r_y3": 734.402, "coord_origin": "TOPLEFT"}, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "parsed_page": null, "predictions": {"layout": {"clusters": [{"id": 0, "label": "caption", "bbox": {"l": 50.112, "t": 508.606, "r": 545.114, "b": 529.113, "coord_origin": "TOPLEFT"}, "confidence": 0.9624594449996948, "cells": [{"index": 0, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 517.158, "r_x1": 91.198, "r_y1": 517.158, "r_x2": 91.198, "r_y2": 508.606, "r_x3": 50.112, "r_y3": 508.606, "coord_origin": "TOPLEFT"}, "text": "Figure 17:", "orig": "Figure 17:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 96.558, "r_y0": 517.158, "r_x1": 545.114, "r_y1": 517.158, "r_x2": 545.114, "r_y2": 508.606, "r_x3": 96.558, "r_y3": 508.606, "coord_origin": "TOPLEFT"}, "text": "Example of long table. End-to-end example from initial PDF cells to prediction of bounding boxes, post process-", "orig": "Example of long table. End-to-end example from initial PDF cells to prediction of bounding boxes, post process-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 529.113, "r_x1": 173.24, "r_y1": 529.113, "r_x2": 173.24, "r_y2": 520.5609999999999, "r_x3": 50.112, "r_y3": 520.5609999999999, "coord_origin": "TOPLEFT"}, "text": "ing and prediction of structure.", "orig": "ing and prediction of structure.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 1, "label": "page_footer", "bbox": {"l": 292.631, "t": 734.402, "r": 302.594, "b": 742.954, "coord_origin": "TOPLEFT"}, "confidence": 0.9134101271629333, "cells": [{"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 292.631, "r_y0": 742.954, "r_x1": 302.594, "r_y1": 742.954, "r_x2": 302.594, "r_y2": 734.402, "r_x3": 292.631, "r_y3": 734.402, "coord_origin": "TOPLEFT"}, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, {"id": 2, "label": "picture", "bbox": {"l": 66.79948425292969, "t": 253.61631774902344, "r": 528.5565795898438, "b": 498.1383972167969, "coord_origin": "TOPLEFT"}, "confidence": 0.6913455724716187, "cells": [], "children": []}]}, "tablestructure": {"table_map": {}}, "figures_classification": null, "equations_prediction": null, "vlm_response": null}, "assembled": {"elements": [{"label": "caption", "id": 0, "page_no": 15, "cluster": {"id": 0, "label": "caption", "bbox": {"l": 50.112, "t": 508.606, "r": 545.114, "b": 529.113, "coord_origin": "TOPLEFT"}, "confidence": 0.9624594449996948, "cells": [{"index": 0, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 517.158, "r_x1": 91.198, "r_y1": 517.158, "r_x2": 91.198, "r_y2": 508.606, "r_x3": 50.112, "r_y3": 508.606, "coord_origin": "TOPLEFT"}, "text": "Figure 17:", "orig": "Figure 17:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 96.558, "r_y0": 517.158, "r_x1": 545.114, "r_y1": 517.158, "r_x2": 545.114, "r_y2": 508.606, "r_x3": 96.558, "r_y3": 508.606, "coord_origin": "TOPLEFT"}, "text": "Example of long table. End-to-end example from initial PDF cells to prediction of bounding boxes, post process-", "orig": "Example of long table. End-to-end example from initial PDF cells to prediction of bounding boxes, post process-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 529.113, "r_x1": 173.24, "r_y1": 529.113, "r_x2": 173.24, "r_y2": 520.5609999999999, "r_x3": 50.112, "r_y3": 520.5609999999999, "coord_origin": "TOPLEFT"}, "text": "ing and prediction of structure.", "orig": "ing and prediction of structure.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Figure 17: Example of long table. End-to-end example from initial PDF cells to prediction of bounding boxes, post processing and prediction of structure."}, {"label": "page_footer", "id": 1, "page_no": 15, "cluster": {"id": 1, "label": "page_footer", "bbox": {"l": 292.631, "t": 734.402, "r": 302.594, "b": 742.954, "coord_origin": "TOPLEFT"}, "confidence": 0.9134101271629333, "cells": [{"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 292.631, "r_y0": 742.954, "r_x1": 302.594, "r_y1": 742.954, "r_x2": 302.594, "r_y2": 734.402, "r_x3": 292.631, "r_y3": 734.402, "coord_origin": "TOPLEFT"}, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "16"}, {"label": "picture", "id": 2, "page_no": 15, "cluster": {"id": 2, "label": "picture", "bbox": {"l": 66.79948425292969, "t": 253.61631774902344, "r": 528.5565795898438, "b": 498.1383972167969, "coord_origin": "TOPLEFT"}, "confidence": 0.6913455724716187, "cells": [], "children": []}, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null}], "body": [{"label": "caption", "id": 0, "page_no": 15, "cluster": {"id": 0, "label": "caption", "bbox": {"l": 50.112, "t": 508.606, "r": 545.114, "b": 529.113, "coord_origin": "TOPLEFT"}, "confidence": 0.9624594449996948, "cells": [{"index": 0, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 517.158, "r_x1": 91.198, "r_y1": 517.158, "r_x2": 91.198, "r_y2": 508.606, "r_x3": 50.112, "r_y3": 508.606, "coord_origin": "TOPLEFT"}, "text": "Figure 17:", "orig": "Figure 17:", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 1, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 96.558, "r_y0": 517.158, "r_x1": 545.114, "r_y1": 517.158, "r_x2": 545.114, "r_y2": 508.606, "r_x3": 96.558, "r_y3": 508.606, "coord_origin": "TOPLEFT"}, "text": "Example of long table. End-to-end example from initial PDF cells to prediction of bounding boxes, post process-", "orig": "Example of long table. End-to-end example from initial PDF cells to prediction of bounding boxes, post process-", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}, {"index": 2, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 50.112, "r_y0": 529.113, "r_x1": 173.24, "r_y1": 529.113, "r_x2": 173.24, "r_y2": 520.5609999999999, "r_x3": 50.112, "r_y3": 520.5609999999999, "coord_origin": "TOPLEFT"}, "text": "ing and prediction of structure.", "orig": "ing and prediction of structure.", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "Figure 17: Example of long table. End-to-end example from initial PDF cells to prediction of bounding boxes, post processing and prediction of structure."}, {"label": "picture", "id": 2, "page_no": 15, "cluster": {"id": 2, "label": "picture", "bbox": {"l": 66.79948425292969, "t": 253.61631774902344, "r": 528.5565795898438, "b": 498.1383972167969, "coord_origin": "TOPLEFT"}, "confidence": 0.6913455724716187, "cells": [], "children": []}, "text": "", "annotations": [], "provenance": null, "predicted_class": null, "confidence": null}], "headers": [{"label": "page_footer", "id": 1, "page_no": 15, "cluster": {"id": 1, "label": "page_footer", "bbox": {"l": 292.631, "t": 734.402, "r": 302.594, "b": 742.954, "coord_origin": "TOPLEFT"}, "confidence": 0.9134101271629333, "cells": [{"index": 3, "rgba": {"r": 0, "g": 0, "b": 0, "a": 255}, "rect": {"r_x0": 292.631, "r_y0": 742.954, "r_x1": 302.594, "r_y1": 742.954, "r_x2": 302.594, "r_y2": 734.402, "r_x3": 292.631, "r_y3": 734.402, "coord_origin": "TOPLEFT"}, "text": "16", "orig": "16", "text_direction": "left_to_right", "confidence": 1.0, "from_ocr": false}], "children": []}, "text": "16"}]}}] |